dm-raid1.c revision 5339fc2d47d1d720e027b9b832bf5aae8fba2ac0
11da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
21da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Copyright (C) 2003 Sistina Software Limited.
31f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen * Copyright (C) 2005-2008 Red Hat, Inc. All rights reserved.
41da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
51da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * This file is released under the GPL.
61da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
71da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow#include "dm-bio-record.h"
91da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/init.h>
111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/mempool.h>
121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/module.h>
131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/pagemap.h>
141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/slab.h>
151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/workqueue.h>
161f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen#include <linux/device-mapper.h>
17a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-io.h>
18a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-dirty-log.h>
19a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-kcopyd.h>
201f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen#include <linux/dm-region-hash.h>
211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/* Message prefix for this target (presumably picked up by DMERR/DMWARN). */
#define DM_MSG_PREFIX "raid1"

#define MAX_RECOVERY 1	/* Maximum number of regions recovered in parallel. */
#define DM_IO_PAGES 64
#define DM_KCOPYD_PAGES 64

/* Bit in mirror_set.features; tested through errors_handled(). */
#define DM_RAID1_HANDLE_ERRORS 0x01
#define errors_handled(p)	((p)->features & DM_RAID1_HANDLE_ERRORS)

/* Wait queue woken by wakeup_all_recovery_waiters(). */
static DECLARE_WAIT_QUEUE_HEAD(_kmirrord_recovery_stopped);
321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
34e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown * Mirror set structures.
35e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown *---------------------------------------------------------------*/
/*
 * Kinds of failure that can be recorded against a mirror leg.
 *
 * fail_mirror() uses the enumerator as a bit number in mirror.error_type,
 * so every value must stay a distinct, small non-negative integer.
 */
enum dm_raid1_error {
	DM_RAID1_WRITE_ERROR,
	DM_RAID1_FLUSH_ERROR,
	DM_RAID1_SYNC_ERROR,
	DM_RAID1_READ_ERROR
};
4272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
43e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brownstruct mirror {
44aa5617c55357d86c9082ba1d66fa9795370c9954Jonathan Brassow	struct mirror_set *ms;
45e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	atomic_t error_count;
4639ed7adb17bdec8224bd3fae551bb7222e05f35bAl Viro	unsigned long error_type;
47e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct dm_dev *dev;
48e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	sector_t offset;
49e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown};
50e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
51e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brownstruct mirror_set {
52e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct dm_target *ti;
53e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct list_head list;
541f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen
55a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	uint64_t features;
56e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
5772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spinlock_t lock;	/* protects the lists */
58e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct bio_list reads;
59e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct bio_list writes;
6072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio_list failures;
6104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio_list holds;	/* bios are waiting until suspend */
62e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
631f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region_hash *rh;
641f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_kcopyd_client *kcopyd_client;
6588be163abb5324bab09f5eff9646590eec5314ebMilan Broz	struct dm_io_client *io_client;
6606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	mempool_t *read_record_pool;
6788be163abb5324bab09f5eff9646590eec5314ebMilan Broz
68e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	/* recovery */
69e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	region_t nr_regions;
70e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	int in_sync;
71fc1ff9588a6d56258ff9576a31aa34f17757c666Jonathan Brassow	int log_failure;
72929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka	int leg_failure;
73b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_t suspend;
74e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
7572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_t default_mirror;	/* Default mirror */
76e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
776ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	struct workqueue_struct *kmirrord_wq;
786ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	struct work_struct kmirrord_work;
79a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	struct timer_list timer;
80a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	unsigned long timer_pending;
81a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
8272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct work_struct trigger_event;
836ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
841f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned nr_mirrors;
85e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct mirror mirror[0];
86e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown};
87e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
881f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void wakeup_mirrord(void *context)
891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
901f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = context;
911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
926ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	queue_work(ms->kmirrord_wq, &ms->kmirrord_work);
936ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski}
946ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
95a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void delayed_wake_fn(unsigned long data)
96a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka{
97a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	struct mirror_set *ms = (struct mirror_set *) data;
98a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
99a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	clear_bit(0, &ms->timer_pending);
1001f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wakeup_mirrord(ms);
101a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka}
102a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
103a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void delayed_wake(struct mirror_set *ms)
104a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka{
105a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	if (test_and_set_bit(0, &ms->timer_pending))
106a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka		return;
107a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
108a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.expires = jiffies + HZ / 5;
109a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.data = (unsigned long) ms;
110a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.function = delayed_wake_fn;
111a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	add_timer(&ms->timer);
112a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka}
113a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
1141f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void wakeup_all_recovery_waiters(void *context)
1151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1161f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wake_up_all(&_kmirrord_recovery_stopped);
1171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1191f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void queue_bio(struct mirror_set *ms, struct bio *bio, int rw)
1201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned long flags;
1221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int should_wake = 0;
1231f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct bio_list *bl;
1241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1251f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	bl = (rw == WRITE) ? &ms->writes : &ms->reads;
1261f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	spin_lock_irqsave(&ms->lock, flags);
1271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	should_wake = !(bl->head);
1281f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	bio_list_add(bl, bio);
1291f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	spin_unlock_irqrestore(&ms->lock, flags);
1301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (should_wake)
1321f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		wakeup_mirrord(ms);
1331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1351f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void dispatch_bios(void *context, struct bio_list *bio_list)
1361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1371f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = context;
1381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct bio *bio;
1391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1401f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	while ((bio = bio_list_pop(bio_list)))
1411f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		queue_bio(ms, bio, WRITE);
1421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow#define MIN_READ_RECORDS 20
14506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstruct dm_raid1_read_record {
14606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m;
14706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_bio_details details;
14806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow};
14906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
15095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockastatic struct kmem_cache *_dm_raid1_read_record_cache;
15195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
1521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
1531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Every mirror should look like this one.
1541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
1551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#define DEFAULT_MIRROR 0
1561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
15806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * This is yucky.  We squirrel the mirror struct away inside
15906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * bi_next for read/write buffers.  This is safe since the bh
1601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * doesn't get submitted to the lower levels of block layer.
1611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
16206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic struct mirror *bio_get_m(struct bio *bio)
1631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
16406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return (struct mirror *) bio->bi_next;
1651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
16706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void bio_set_m(struct bio *bio, struct mirror *m)
1681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
16906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio->bi_next = (struct bio *) m;
1701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
17272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic struct mirror *get_default_mirror(struct mirror_set *ms)
17372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
17472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	return &ms->mirror[atomic_read(&ms->default_mirror)];
17572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
17672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
17772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void set_default_mirror(struct mirror *m)
17872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
17972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms = m->ms;
18072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror *m0 = &(ms->mirror[0]);
18172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
18272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&ms->default_mirror, m - m0);
18372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
18472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
18587968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patockastatic struct mirror *get_valid_mirror(struct mirror_set *ms)
18687968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka{
18787968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	struct mirror *m;
18887968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka
18987968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	for (m = ms->mirror; m < ms->mirror + ms->nr_mirrors; m++)
19087968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka		if (!atomic_read(&m->error_count))
19187968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka			return m;
19287968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka
19387968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	return NULL;
19487968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka}
19587968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka
19672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow/* fail_mirror
19772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * @m: mirror device to fail
19872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * @error_type: one of the enum's, DM_RAID1_*_ERROR
19972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow *
20072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * If errors are being handled, record the type of
20172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * error encountered for this device.  If this type
20272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * of error has already been recorded, we can return;
20372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * otherwise, we must signal userspace by triggering
20472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * an event.  Additionally, if the device is the
20572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * primary device, we must choose a new primary, but
20672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * only if the mirror is in-sync.
20772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow *
20872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * This function must not block.
20972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow */
21072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void fail_mirror(struct mirror *m, enum dm_raid1_error error_type)
21172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
21272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms = m->ms;
21372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror *new;
21472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
215929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka	ms->leg_failure = 1;
216929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka
21772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	/*
21872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * error_count is used for nothing more than a
21972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * simple way to tell if a device has encountered
22072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * errors.
22172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 */
22272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_inc(&m->error_count);
22372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
22472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (test_and_set_bit(error_type, &m->error_type))
22572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
22672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
227d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow	if (!errors_handled(ms))
228d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow		return;
229d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow
23072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (m != get_default_mirror(ms))
23172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
23272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
23372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (!ms->in_sync) {
23472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		/*
23572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * Better to issue requests to same failing device
23672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * than to risk returning corrupt data.
23772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 */
23872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMERR("Primary mirror (%s) failed while out-of-sync: "
23972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		      "Reads may fail.", m->dev->name);
24072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
24172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	}
24272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
24387968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	new = get_valid_mirror(ms);
24487968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	if (new)
24587968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka		set_default_mirror(new);
24687968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	else
24772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMWARN("All sides of mirror have failed.");
24872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
24972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowout:
25072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	schedule_work(&ms->trigger_event);
25172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
25272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
253c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patockastatic int mirror_flush(struct dm_target *ti)
254c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka{
255c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct mirror_set *ms = ti->private;
256c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	unsigned long error_bits;
257c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
258c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	unsigned int i;
259c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct dm_io_region io[ms->nr_mirrors];
260c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct mirror *m;
261c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct dm_io_request io_req = {
262c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.bi_rw = WRITE_BARRIER,
263c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.mem.type = DM_IO_KMEM,
264c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.mem.ptr.bvec = NULL,
265c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.client = ms->io_client,
266c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	};
267c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
268c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	for (i = 0, m = ms->mirror; i < ms->nr_mirrors; i++, m++) {
269c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].bdev = m->dev->bdev;
270c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].sector = 0;
271c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].count = 0;
272c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	}
273c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
274c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	error_bits = -1;
275c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	dm_io(&io_req, ms->nr_mirrors, io, &error_bits);
276c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	if (unlikely(error_bits != 0)) {
277c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		for (i = 0; i < ms->nr_mirrors; i++)
278c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka			if (test_bit(i, &error_bits))
279c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka				fail_mirror(ms->mirror + i,
28064b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka					    DM_RAID1_FLUSH_ERROR);
281c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		return -EIO;
282c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	}
283c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
284c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	return 0;
285c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka}
286c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
2871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
2881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Recovery.
2891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
2901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * When a mirror is first activated we may find that some regions
2911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * are in the no-sync state.  We have to recover these by
2921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recopying from the default mirror to all the others.
2931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
2944cdc1d1fa5c5ac14dc21be19832f02fd0b83867eAlasdair G Kergonstatic void recovery_complete(int read_err, unsigned long write_err,
2951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			      void *context)
2961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
2971f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region *reg = context;
2981f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = dm_rh_region_context(reg);
2998f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	int m, bit = 0;
3001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3018f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	if (read_err) {
302f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow		/* Read error means the failure of default mirror. */
303f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow		DMERR_LIMIT("Unable to read primary mirror during recovery");
3048f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		fail_mirror(get_default_mirror(ms), DM_RAID1_SYNC_ERROR);
3058f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	}
306f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
3078f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	if (write_err) {
3084cdc1d1fa5c5ac14dc21be19832f02fd0b83867eAlasdair G Kergon		DMERR_LIMIT("Write error during recovery (error = 0x%lx)",
309f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow			    write_err);
3108f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		/*
3118f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 * Bits correspond to devices (excluding default mirror).
3128f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 * The default mirror cannot change during recovery.
3138f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 */
3148f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		for (m = 0; m < ms->nr_mirrors; m++) {
3158f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			if (&ms->mirror[m] == get_default_mirror(ms))
3168f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow				continue;
3178f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			if (test_bit(bit, &write_err))
3188f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow				fail_mirror(ms->mirror + m,
3198f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow					    DM_RAID1_SYNC_ERROR);
3208f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			bit++;
3218f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		}
3228f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	}
323f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
3241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_recovery_end(reg, !(read_err || write_err));
3251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic int recover(struct mirror_set *ms, struct dm_region *reg)
3281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
3291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
3301f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned i;
331eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	struct dm_io_region from, to[DM_KCOPYD_MAX_REGIONS], *dest;
3321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
3331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned long flags = 0;
3341f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	region_t key = dm_rh_get_region_key(reg);
3351f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	sector_t region_size = dm_rh_get_region_size(ms->rh);
3361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* fill in the source */
33872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	m = get_default_mirror(ms);
3391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	from.bdev = m->dev->bdev;
3401f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	from.sector = m->offset + dm_rh_region_to_sector(ms->rh, key);
3411f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (key == (ms->nr_regions - 1)) {
3421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
3431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * The final region may be smaller than
3441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * region_size.
3451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
3461f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		from.count = ms->ti->len & (region_size - 1);
3471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (!from.count)
3481f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			from.count = region_size;
3491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	} else
3501f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		from.count = region_size;
3511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* fill in the destinations */
3531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	for (i = 0, dest = to; i < ms->nr_mirrors; i++) {
35472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (&ms->mirror[i] == get_default_mirror(ms))
3551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			continue;
3561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		m = ms->mirror + i;
3581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest->bdev = m->dev->bdev;
3591f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		dest->sector = m->offset + dm_rh_region_to_sector(ms->rh, key);
3601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest->count = from.count;
3611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest++;
3621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* hand to kcopyd */
365f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow	if (!errors_handled(ms))
366f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow		set_bit(DM_KCOPYD_IGNORE_ERROR, &flags);
367f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow
368eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	r = dm_kcopyd_copy(ms->kcopyd_client, &from, ms->nr_mirrors - 1, to,
369eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen			   flags, recovery_complete, reg);
3701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return r;
3721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_recovery(struct mirror_set *ms)
3751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
3761f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region *reg;
3771f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
3781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
3791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Start quiescing some regions.
3821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3831f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_recovery_prepare(ms->rh);
3841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Copy any already quiesced regions.
3871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3881f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	while ((reg = dm_rh_recovery_start(ms->rh))) {
3891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		r = recover(ms, reg);
3901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (r)
3911f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			dm_rh_recovery_end(reg, 0);
3921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Update the in sync flag.
3961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms->in_sync &&
3981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	    (log->type->get_sync_count(log) == ms->nr_regions)) {
3991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* the sync is complete */
4001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dm_table_event(ms->ti->table);
4011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		ms->in_sync = 1;
4021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
4031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
4041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
4051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
4061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Reads
4071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
4081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror *choose_mirror(struct mirror_set *ms, sector_t sector)
4091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
41006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m = get_default_mirror(ms);
41106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	do {
41306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (likely(!atomic_read(&m->error_count)))
41406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return m;
41506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (m-- == ms->mirror)
41706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			m += ms->nr_mirrors;
41806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	} while (m != get_default_mirror(ms));
41906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return NULL;
42106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
42206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic int default_ok(struct mirror *m)
42406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
42506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *default_mirror = get_default_mirror(m->ms);
42606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return !atomic_read(&default_mirror->error_count);
42806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
42906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
43006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic int mirror_available(struct mirror_set *ms, struct bio *bio)
43106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
4321f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
4331f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	region_t region = dm_rh_bio_to_region(ms->rh, bio);
43406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
4351f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (log->type->in_sync(log, region, 0))
43606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return choose_mirror(ms,  bio->bi_sector) ? 1 : 0;
43706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
43806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return 0;
4391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
4401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
4411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
4421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * remap a buffer to a particular mirror.
4431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
44406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic sector_t map_sector(struct mirror *m, struct bio *bio)
44506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
4464184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka	if (unlikely(!bio->bi_size))
4474184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		return 0;
44806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return m->offset + (bio->bi_sector - m->ms->ti->begin);
44906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
45006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
45106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void map_bio(struct mirror *m, struct bio *bio)
4521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
4531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio->bi_bdev = m->dev->bdev;
45406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio->bi_sector = map_sector(m, bio);
45506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
45606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
45722a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagenstatic void map_region(struct dm_io_region *io, struct mirror *m,
45806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		       struct bio *bio)
45906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
46006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->bdev = m->dev->bdev;
46106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->sector = map_sector(m, bio);
46206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->count = bio->bi_size >> 9;
46306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
46406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
46504788507686d184d8166918b70ef52311bc36dcbMikulas Patockastatic void hold_bio(struct mirror_set *ms, struct bio *bio)
46604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka{
46704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
46804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * If device is suspended, complete the bio.
46904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
47004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	if (atomic_read(&ms->suspend)) {
47104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		if (dm_noflush_suspending(ms->ti))
47204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka			bio_endio(bio, DM_ENDIO_REQUEUE);
47304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		else
47404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka			bio_endio(bio, -EIO);
47504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		return;
47604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	}
47704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
47804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
47904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Hold bio until the suspend is complete.
48004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
48104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_lock_irq(&ms->lock);
48204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	bio_list_add(&ms->holds, bio);
48304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_unlock_irq(&ms->lock);
48404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka}
48504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
48606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow/*-----------------------------------------------------------------
48706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * Reads
48806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow *---------------------------------------------------------------*/
48906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void read_callback(unsigned long error, void *context)
49006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
49106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct bio *bio = context;
49206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m;
49306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
49406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	m = bio_get_m(bio);
49506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, NULL);
49606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
49706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(!error)) {
49806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		bio_endio(bio, 0);
49906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return;
50006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
50106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	fail_mirror(m, DM_RAID1_READ_ERROR);
50306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(default_ok(m)) || mirror_available(m->ms, bio)) {
50506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMWARN_LIMIT("Read failure on mirror device %s.  "
50606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			     "Trying alternative device.",
50706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			     m->dev->name);
50806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		queue_bio(m->ms, bio, bio_rw(bio));
50906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return;
51006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
51106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
51206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	DMERR_LIMIT("Read failure on mirror device %s.  Failing I/O.",
51306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		    m->dev->name);
51406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_endio(bio, -EIO);
51506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
51606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
51706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow/* Asynchronous read. */
51806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void read_async_bio(struct mirror *m, struct bio *bio)
51906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
52022a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagen	struct dm_io_region io;
52106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_io_request io_req = {
52206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.bi_rw = READ,
52306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.mem.type = DM_IO_BVEC,
52406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.mem.ptr.bvec = bio->bi_io_vec + bio->bi_idx,
52506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.notify.fn = read_callback,
52606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.notify.context = bio,
52706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.client = m->ms->io_client,
52806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	};
52906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
53006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	map_region(&io, m, bio);
53106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, m);
5321f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	BUG_ON(dm_io(&io_req, 1, &io, NULL));
5331f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen}
5341f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen
5351f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic inline int region_in_sync(struct mirror_set *ms, region_t region,
5361f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				 int may_block)
5371f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen{
5381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	int state = dm_rh_get_state(ms->rh, region, may_block);
5391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	return state == DM_RH_CLEAN || state == DM_RH_DIRTY;
5401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
5411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_reads(struct mirror_set *ms, struct bio_list *reads)
5431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
5441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	region_t region;
5451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio;
5461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
5471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(reads))) {
5491f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		region = dm_rh_bio_to_region(ms->rh, bio);
55006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		m = get_default_mirror(ms);
5511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
5531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * We can only read balance if the region is in sync.
5541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
5551f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		if (likely(region_in_sync(ms, region, 1)))
5561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			m = choose_mirror(ms, bio->bi_sector);
55706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		else if (m && atomic_read(&m->error_count))
55806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			m = NULL;
5591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
56006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (likely(m))
56106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			read_async_bio(m, bio);
56206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		else
56306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			bio_endio(bio, -EIO);
5641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
5651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
5661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/*-----------------------------------------------------------------
 * Writes.
 *
 * We do different things with the write io depending on the
 * state of the region that it's in:
 *
 * SYNC: 	increment pending, use dm_io to write to *all* mirrors
 * RECOVERING:	delay the io until recovery completes
 * NOSYNC:	increment pending, just write to the default mirror
 *---------------------------------------------------------------*/
57772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
57872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
5791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void write_callback(unsigned long error, void *context)
5801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
58172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned i, ret = 0;
5821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio = (struct bio *) context;
5831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms;
58472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	int should_wake = 0;
58572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned long flags;
5861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
58706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	ms = bio_get_m(bio)->ms;
58806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, NULL);
5891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
5911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * NOTE: We don't decrement the pending count here,
5921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * instead it is done by the targets endio function.
5931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * This way we handle both writes to SYNC and NOSYNC
5941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * regions with the same code.
5951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
59660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	if (likely(!error)) {
59760f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		bio_endio(bio, ret);
59860f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		return;
59960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	}
6001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
60172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	for (i = 0; i < ms->nr_mirrors; i++)
60272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (test_bit(i, &error))
60372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			fail_mirror(ms->mirror + i, DM_RAID1_WRITE_ERROR);
60472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
60560f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	/*
60660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 * Need to raise event.  Since raising
60760f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 * events can block, we need to do it in
60860f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 * the main thread.
60960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 */
61060f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	spin_lock_irqsave(&ms->lock, flags);
61160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	if (!ms->failures.head)
61260f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		should_wake = 1;
61360f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	bio_list_add(&ms->failures, bio);
61460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	spin_unlock_irqrestore(&ms->lock, flags);
61560f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	if (should_wake)
61660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		wakeup_mirrord(ms);
6171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
6181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_write(struct mirror_set *ms, struct bio *bio)
6201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
6211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned int i;
62222a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagen	struct dm_io_region io[ms->nr_mirrors], *dest = io;
6231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
62488be163abb5324bab09f5eff9646590eec5314ebMilan Broz	struct dm_io_request io_req = {
6254184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		.bi_rw = WRITE | (bio->bi_rw & WRITE_BARRIER),
62688be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.mem.type = DM_IO_BVEC,
62788be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.mem.ptr.bvec = bio->bi_io_vec + bio->bi_idx,
62888be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.notify.fn = write_callback,
62988be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.notify.context = bio,
63088be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.client = ms->io_client,
63188be163abb5324bab09f5eff9646590eec5314ebMilan Broz	};
6321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
63306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	for (i = 0, m = ms->mirror; i < ms->nr_mirrors; i++, m++)
63406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_region(dest++, m, bio);
6351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
63606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	/*
63706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * Use default mirror because we only need it to retrieve the reference
63806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * to the mirror set in write_callback().
63906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 */
64006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, get_default_mirror(ms));
64188be163abb5324bab09f5eff9646590eec5314ebMilan Broz
6421f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	BUG_ON(dm_io(&io_req, ms->nr_mirrors, io, NULL));
6431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
6441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_writes(struct mirror_set *ms, struct bio_list *writes)
6461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
6471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int state;
6481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio;
6491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio_list sync, nosync, recover, *this_list = NULL;
6507513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	struct bio_list requeue;
6517513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
6527513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	region_t region;
6531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!writes->head)
6551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return;
6561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
6581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Classify each write.
6591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
6601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&sync);
6611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&nosync);
6621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&recover);
6637513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	bio_list_init(&requeue);
6641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(writes))) {
6664184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		if (unlikely(bio_empty_barrier(bio))) {
6674184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			bio_list_add(&sync, bio);
6684184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			continue;
6694184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		}
6704184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka
6717513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		region = dm_rh_bio_to_region(ms->rh, bio);
6727513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
6737513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		if (log->type->is_remote_recovering &&
6747513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		    log->type->is_remote_recovering(log, region)) {
6757513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow			bio_list_add(&requeue, bio);
6767513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow			continue;
6777513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		}
6787513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
6797513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		state = dm_rh_get_state(ms->rh, region, 1);
6801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		switch (state) {
6811f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_CLEAN:
6821f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_DIRTY:
6831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &sync;
6841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6861f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_NOSYNC:
6871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &nosync;
6881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6901f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_RECOVERING:
6911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &recover;
6921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		}
6941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		bio_list_add(this_list, bio);
6961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
6971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
6997513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 * Add bios that are delayed due to remote recovery
7007513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 * back on to the write queue
7017513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 */
7027513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	if (unlikely(requeue.head)) {
7037513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		spin_lock_irq(&ms->lock);
7047513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		bio_list_merge(&ms->writes, &requeue);
7057513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		spin_unlock_irq(&ms->lock);
70669885683d22d8c05910fd808c01fdce1322739b4Mikulas Patocka		delayed_wake(ms);
7077513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	}
7087513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
7097513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	/*
7101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Increment the pending counts for any regions that will
7111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * be written to (writes to recover regions are going to
7121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * be delayed).
7131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
7141f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_inc_pending(ms->rh, &sync);
7151f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_inc_pending(ms->rh, &nosync);
716d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow
717d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	/*
718d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * If the flush fails on a previous call and succeeds here,
719d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * we must not reset the log_failure variable.  We need
720d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * userspace interaction to do that.
721d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 */
722d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	ms->log_failure = dm_rh_flush(ms->rh) ? 1 : ms->log_failure;
7231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
7251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Dispatch io.
7261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
727b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	if (unlikely(ms->log_failure)) {
728b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		spin_lock_irq(&ms->lock);
729b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		bio_list_merge(&ms->failures, &sync);
730b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		spin_unlock_irq(&ms->lock);
7311f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		wakeup_mirrord(ms);
732b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	} else
733fc1ff9588a6d56258ff9576a31aa34f17757c666Jonathan Brassow		while ((bio = bio_list_pop(&sync)))
734b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow			do_write(ms, bio);
7351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(&recover)))
7371f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		dm_rh_delay(ms->rh, bio);
7381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(&nosync))) {
740929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka		if (unlikely(ms->leg_failure) && errors_handled(ms))
741929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka			hold_bio(ms, bio);
742929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka		else {
743929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka			map_bio(get_default_mirror(ms), bio);
744929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka			generic_make_request(bio);
745929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka		}
7461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
7471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
7481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
74972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void do_failures(struct mirror_set *ms, struct bio_list *failures)
75072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
75172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio *bio;
75272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
7530f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	if (likely(!failures->head))
75472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
75572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
756b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
757b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * If the log has failed, unattempted writes are being
7580f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	 * put on the holds list.  We can't issue those writes
759b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * until a log has been marked, so we must store them.
760b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 *
761b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * If a 'noflush' suspend is in progress, we can requeue
762b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * the I/O's to the core.  This give userspace a chance
763b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * to reconfigure the mirror, at which point the core
764b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * will reissue the writes.  If the 'noflush' flag is
765b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * not set, we have no choice but to return errors.
766b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 *
767b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * Some writes on the failures list may have been
768b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * submitted before the log failure and represent a
769b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * failure to write to one of the devices.  It is ok
770b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * for us to treat them the same and requeue them
771b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * as well.
772b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
7730f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	while ((bio = bio_list_pop(failures))) {
77460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		if (!ms->log_failure) {
7750f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka			ms->in_sync = 0;
776c58098be979509a54021e837a47fcad08db31f94Mikulas Patocka			dm_rh_mark_nosync(ms->rh, bio);
7770f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka		}
77860f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka
77960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		/*
78060f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * If all the legs are dead, fail the I/O.
78160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * If we have been told to handle errors, hold the bio
78260f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * and wait for userspace to deal with the problem.
78360f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * Otherwise pretend that the I/O succeeded. (This would
78460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * be wrong if the failed leg returned after reboot and
78560f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * got replicated back to the good legs.)
78660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 */
78760f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		if (!get_valid_mirror(ms))
78860f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka			bio_endio(bio, -EIO);
78960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		else if (errors_handled(ms))
79060f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka			hold_bio(ms, bio);
79160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		else
79260f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka			bio_endio(bio, 0);
793b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	}
79472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
79572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
79672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void trigger_event(struct work_struct *work)
79772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
79872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms =
79972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		container_of(work, struct mirror_set, trigger_event);
80072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
80172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	dm_table_event(ms->ti->table);
80272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
80372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
/*-----------------------------------------------------------------
 * kmirrord
 *---------------------------------------------------------------*/
807a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void do_mirror(struct work_struct *work)
8081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8091f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = container_of(work, struct mirror_set,
8101f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     kmirrord_work);
81172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio_list reads, writes, failures;
81272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned long flags;
8131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
81472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spin_lock_irqsave(&ms->lock, flags);
8151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	reads = ms->reads;
8161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	writes = ms->writes;
81772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	failures = ms->failures;
8181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&ms->reads);
8191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&ms->writes);
82072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	bio_list_init(&ms->failures);
82172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spin_unlock_irqrestore(&ms->lock, flags);
8221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8231f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_update_states(ms->rh, errors_handled(ms));
8241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_recovery(ms);
8251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_reads(ms, &reads);
8261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_writes(ms, &writes);
82772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	do_failures(ms, &failures);
8287ff14a36159d947872870e7a3e9dcaebc46b23ebMikulas Patocka
8297ff14a36159d947872870e7a3e9dcaebc46b23ebMikulas Patocka	dm_table_unplug_all(ms->ti->table);
8301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
8311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/*-----------------------------------------------------------------
 * Target functions
 *---------------------------------------------------------------*/
8351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror_set *alloc_context(unsigned int nr_mirrors,
8361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds					uint32_t region_size,
8371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds					struct dm_target *ti,
838416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen					struct dm_dirty_log *dl)
8391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	size_t len;
8411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = NULL;
8421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	len = sizeof(*ms) + (sizeof(ms->mirror[0]) * nr_mirrors);
8441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
845dd00cc486ab1c17049a535413d1751ef3482141cYoann Padioleau	ms = kzalloc(len, GFP_KERNEL);
8461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms) {
84772d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Cannot allocate mirror context";
8481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
8491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
8501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	spin_lock_init(&ms->lock);
8525339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->reads);
8535339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->writes);
8545339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->failures);
8555339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->holds);
8561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->ti = ti;
8581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->nr_mirrors = nr_mirrors;
8591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->nr_regions = dm_sector_div_up(ti->len, region_size);
8601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->in_sync = 0;
861b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	ms->log_failure = 0;
862929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka	ms->leg_failure = 0;
863b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 0);
86472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&ms->default_mirror, DEFAULT_MIRROR);
8651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
86695f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	ms->read_record_pool = mempool_create_slab_pool(MIN_READ_RECORDS,
86795f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka						_dm_raid1_read_record_cache);
86895f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
86906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (!ms->read_record_pool) {
87006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		ti->error = "Error creating mirror read_record_pool";
87106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		kfree(ms);
87206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return NULL;
87306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
87406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
87588be163abb5324bab09f5eff9646590eec5314ebMilan Broz	ms->io_client = dm_io_client_create(DM_IO_PAGES);
87688be163abb5324bab09f5eff9646590eec5314ebMilan Broz	if (IS_ERR(ms->io_client)) {
87788be163abb5324bab09f5eff9646590eec5314ebMilan Broz		ti->error = "Error creating dm_io client";
87806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_destroy(ms->read_record_pool);
87988be163abb5324bab09f5eff9646590eec5314ebMilan Broz		kfree(ms);
88088be163abb5324bab09f5eff9646590eec5314ebMilan Broz 		return NULL;
88188be163abb5324bab09f5eff9646590eec5314ebMilan Broz	}
88288be163abb5324bab09f5eff9646590eec5314ebMilan Broz
8831f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	ms->rh = dm_region_hash_create(ms, dispatch_bios, wakeup_mirrord,
8841f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       wakeup_all_recovery_waiters,
8851f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       ms->ti->begin, MAX_RECOVERY,
8861f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       dl, region_size, ms->nr_regions);
8871f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (IS_ERR(ms->rh)) {
88872d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Error creating dirty region hash";
889a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		dm_io_client_destroy(ms->io_client);
89006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_destroy(ms->read_record_pool);
8911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		kfree(ms);
8921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
8931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
8941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return ms;
8961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
8971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void free_context(struct mirror_set *ms, struct dm_target *ti,
8991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 unsigned int m)
9001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while (m--)
9021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dm_put_device(ti, ms->mirror[m].dev);
9031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
90488be163abb5324bab09f5eff9646590eec5314ebMilan Broz	dm_io_client_destroy(ms->io_client);
9051f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_region_hash_destroy(ms->rh);
90606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	mempool_destroy(ms->read_record_pool);
9071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	kfree(ms);
9081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int get_mirror(struct mirror_set *ms, struct dm_target *ti,
9111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		      unsigned int mirror, char **argv)
9121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9134ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton	unsigned long long offset;
9141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9154ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton	if (sscanf(argv[1], "%llu", &offset) != 1) {
91672d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid offset";
9171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
9181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (dm_get_device(ti, argv[0], offset, ti->len,
9211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			  dm_table_get_mode(ti->table),
9221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			  &ms->mirror[mirror].dev)) {
92372d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Device lookup failure";
9241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -ENXIO;
9251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
927aa5617c55357d86c9082ba1d66fa9795370c9954Jonathan Brassow	ms->mirror[mirror].ms = ms;
92872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&(ms->mirror[mirror].error_count), 0);
92972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	ms->mirror[mirror].error_type = 0;
9301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->mirror[mirror].offset = offset;
9311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
9331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
9361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Create dirty log: log_type #log_params <log_params>
9371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
938416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagenstatic struct dm_dirty_log *create_dirty_log(struct dm_target *ti,
9391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     unsigned argc, char **argv,
9401f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     unsigned *args_used)
9411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9421f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned param_count;
943416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen	struct dm_dirty_log *dl;
9441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (argc < 2) {
94672d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Insufficient mirror log arguments";
9471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (sscanf(argv[1], "%u", &param_count) != 1) {
95172d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid mirror log argument count";
9521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	*args_used = 2 + param_count;
9561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (argc < *args_used) {
95872d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Insufficient mirror log arguments";
9591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
962c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	dl = dm_dirty_log_create(argv[0], ti, mirror_flush, param_count,
963c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka				 argv + 2);
9641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!dl) {
96572d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Error creating mirror dirty log";
9661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return dl;
9701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
972a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassowstatic int parse_features(struct mirror_set *ms, unsigned argc, char **argv,
973a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow			  unsigned *args_used)
974a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow{
975a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	unsigned num_features;
976a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	struct dm_target *ti = ms->ti;
977a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
978a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	*args_used = 0;
979a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
980a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (!argc)
981a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return 0;
982a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
983a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (sscanf(argv[0], "%u", &num_features) != 1) {
984a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Invalid number of features";
985a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
986a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
987a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
988a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argc--;
989a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argv++;
990a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	(*args_used)++;
991a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
992a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (num_features > argc) {
993a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Not enough arguments to support feature count";
994a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
995a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
996a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
997a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (!strcmp("handle_errors", argv[0]))
998a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ms->features |= DM_RAID1_HANDLE_ERRORS;
999a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	else {
1000a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Unrecognised feature requested";
1001a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
1002a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1003a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1004a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	(*args_used)++;
1005a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1006a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	return 0;
1007a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow}
1008a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
10091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
10101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Construct a mirror mapping:
10111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
10121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type #log_params <log_params>
10131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #mirrors [mirror_path offset]{2,}
1014a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow * [#features <features>]
10151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
10161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type is "core" or "disk"
10171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #log_params is between 1 and 3
1018a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow *
1019a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow * If present, features must be "handle_errors".
10201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
10211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_ctr(struct dm_target *ti, unsigned int argc, char **argv)
10221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
10231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
10241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned int nr_mirrors, m, args_used;
10251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms;
1026416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen	struct dm_dirty_log *dl;
10271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	dl = create_dirty_log(ti, argc, argv, &args_used);
10291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!dl)
10301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argv += args_used;
10331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argc -= args_used;
10341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!argc || sscanf(argv[0], "%u", &nr_mirrors) != 1 ||
1036eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	    nr_mirrors < 2 || nr_mirrors > DM_KCOPYD_MAX_REGIONS + 1) {
103772d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid number of mirrors";
1038416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argv++, argc--;
10431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1044a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (argc < nr_mirrors * 2) {
1045a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Too few mirror arguments";
1046416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms = alloc_context(nr_mirrors, dl->type->get_region_size(dl), ti, dl);
10511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms) {
1052416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -ENOMEM;
10541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* Get the mirror parameter sets */
10571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	for (m = 0; m < nr_mirrors; m++) {
10581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		r = get_mirror(ms, ti, m, argv);
10591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (r) {
10601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			free_context(ms, ti, m);
10611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			return r;
10621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		}
10631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		argv += 2;
10641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		argc -= 2;
10651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ti->private = ms;
10681f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	ti->split_io = dm_rh_get_region_size(ms->rh);
10694184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka	ti->num_flush_requests = 1;
10701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10716ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	ms->kmirrord_wq = create_singlethread_workqueue("kmirrord");
10726ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	if (!ms->kmirrord_wq) {
10736ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski		DMERR("couldn't start kmirrord");
1074a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		r = -ENOMEM;
1075a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_free_context;
10766ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	}
10776ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	INIT_WORK(&ms->kmirrord_work, do_mirror);
1078a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	init_timer(&ms->timer);
1079a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer_pending = 0;
108072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	INIT_WORK(&ms->trigger_event, trigger_event);
10816ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
1082a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	r = parse_features(ms, argc, argv, &args_used);
1083a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	if (r)
1084a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1085a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1086a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argv += args_used;
1087a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argc -= args_used;
1088a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1089f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	/*
1090f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * Any read-balancing addition depends on the
1091f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * DM_RAID1_HANDLE_ERRORS flag being present.
1092f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * This is because the decision to balance depends
1093f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * on the sync state of a region.  If the above
1094f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * flag is not present, we ignore errors; and
1095f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * the sync state may be inaccurate.
1096f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 */
1097f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
1098a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (argc) {
1099a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Too many mirror arguments";
1100a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		r = -EINVAL;
1101a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1102a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1103a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
11041f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	r = dm_kcopyd_client_create(DM_KCOPYD_PAGES, &ms->kcopyd_client);
1105a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	if (r)
1106a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
11071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11081f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wakeup_mirrord(ms);
11091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
1110a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov
1111a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhoverr_destroy_wq:
1112a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	destroy_workqueue(ms->kmirrord_wq);
1113a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhoverr_free_context:
1114a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	free_context(ms, ti, ms->nr_mirrors);
1115a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	return r;
11161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_dtr(struct dm_target *ti)
11191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
11211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1122a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	del_timer_sync(&ms->timer);
11236ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	flush_workqueue(ms->kmirrord_wq);
112418776c7316545482a02bfaa2629a2aa1afc48357Mikulas Patocka	flush_scheduled_work();
1125eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	dm_kcopyd_client_destroy(ms->kcopyd_client);
11266ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	destroy_workqueue(ms->kmirrord_wq);
11271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	free_context(ms, ti, ms->nr_mirrors);
11281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
11311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Mirror mapping function
11321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
11331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_map(struct dm_target *ti, struct bio *bio,
11341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		      union map_info *map_context)
11351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r, rw = bio_rw(bio);
11371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
11381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = ti->private;
113906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_raid1_read_record *read_record = NULL;
11401f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
11411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (rw == WRITE) {
114306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		/* Save region for mirror_end_io() handler */
11441f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		map_context->ll = dm_rh_bio_to_region(ms->rh, bio);
11451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		queue_bio(ms, bio, rw);
1146d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda		return DM_MAPIO_SUBMITTED;
11471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
11481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11491f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	r = log->type->in_sync(log, dm_rh_bio_to_region(ms->rh, bio), 0);
11501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (r < 0 && r != -EWOULDBLOCK)
11511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return r;
11521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
115406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * If region is not in-sync queue the bio.
11551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
115606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (!r || (r == -EWOULDBLOCK)) {
115706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (rw == READA)
115806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return -EWOULDBLOCK;
11591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		queue_bio(ms, bio, rw);
1161d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda		return DM_MAPIO_SUBMITTED;
11621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
11631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
116406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	/*
116506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * The region is in-sync and we can perform reads directly.
116606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * Store enough information so we can retry if it fails.
116706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 */
11681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	m = choose_mirror(ms, bio->bi_sector);
116906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (unlikely(!m))
11701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EIO;
11711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
117206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	read_record = mempool_alloc(ms->read_record_pool, GFP_NOIO);
117306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(read_record)) {
117406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		dm_bio_record(&read_record->details, bio);
117506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_context->ptr = read_record;
117606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		read_record->m = m;
117706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
117806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
117906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	map_bio(m, bio);
118006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
1181d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda	return DM_MAPIO_REMAPPED;
11821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_end_io(struct dm_target *ti, struct bio *bio,
11851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 int error, union map_info *map_context)
11861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int rw = bio_rw(bio);
11881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
118906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m = NULL;
119006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_bio_details *bd = NULL;
119106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_raid1_read_record *read_record = map_context->ptr;
11921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
11941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * We need to dec pending if this was a write.
11951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
119606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (rw == WRITE) {
11974184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		if (likely(!bio_empty_barrier(bio)))
11984184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			dm_rh_dec(ms->rh, map_context->ll);
119906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return error;
120006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
12011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
120206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (error == -EOPNOTSUPP)
120306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		goto out;
120406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
12051f98a13f623e0ef666690a18c1250335fc6d7ef1Jens Axboe	if ((error == -EWOULDBLOCK) && bio_rw_flagged(bio, BIO_RW_AHEAD))
120606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		goto out;
120706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
120806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (unlikely(error)) {
120906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (!read_record) {
121006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			/*
121106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * There wasn't enough memory to record necessary
121206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * information for a retry or there was no other
121306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * mirror in-sync.
121406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 */
1215e03f1a842287480aa03732612148c0d333baca61Adrian Bunk			DMERR_LIMIT("Mirror read failed.");
121606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return -EIO;
121706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		}
1218e03f1a842287480aa03732612148c0d333baca61Adrian Bunk
1219e03f1a842287480aa03732612148c0d333baca61Adrian Bunk		m = read_record->m;
1220e03f1a842287480aa03732612148c0d333baca61Adrian Bunk
122106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMERR("Mirror read failed from %s. Trying alternative device.",
122206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		      m->dev->name);
122306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
122406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		fail_mirror(m, DM_RAID1_READ_ERROR);
122506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
122606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		/*
122706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 * A failed read is requeued for another attempt using an intact
122806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 * mirror.
122906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 */
123006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (default_ok(m) || mirror_available(ms, bio)) {
123106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			bd = &read_record->details;
123206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
123306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			dm_bio_restore(bd, bio);
123406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			mempool_free(read_record, ms->read_record_pool);
123506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			map_context->ptr = NULL;
123606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			queue_bio(ms, bio, rw);
123706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return 1;
123806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		}
123906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMERR("All replicated volumes dead, failing I/O");
124006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
124106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
124206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowout:
124306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (read_record) {
124406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_free(read_record, ms->read_record_pool);
124506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_context->ptr = NULL;
124606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
124706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
124806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return error;
12491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
12501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1251b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassowstatic void mirror_presuspend(struct dm_target *ti)
12521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
12531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
12541f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
12551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
125604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio_list holds;
125704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio *bio;
125804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
1259b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 1);
1260b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1261b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
1262b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * We must finish up all the work that we've
1263b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * generated (i.e. recovery work).
1264b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
12651f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_stop_recovery(ms->rh);
126633184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow
126733184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow	wait_event(_kmirrord_recovery_stopped,
12681f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		   !dm_rh_recovery_in_flight(ms->rh));
126933184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow
1270b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	if (log->type->presuspend && log->type->presuspend(log))
1271b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		/* FIXME: need better error handling */
1272b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		DMWARN("log presuspend failed");
1273b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1274b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
1275b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * Now that recovery is complete/stopped and the
1276b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * delayed bios are queued, we need to wait for
1277b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * the worker thread to complete.  This way,
1278b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * we know that all of our I/O has been pushed.
1279b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
1280b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	flush_workqueue(ms->kmirrord_wq);
128104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
128204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
128304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Now set ms->suspend is set and the workqueue flushed, no more
128404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * entries can be added to ms->hold list, so process it.
128504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 *
128604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Bios can still arrive concurrently with or after this
128704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * presuspend function, but they cannot join the hold list
128804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * because ms->suspend is set.
128904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
129004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_lock_irq(&ms->lock);
129104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	holds = ms->holds;
129204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	bio_list_init(&ms->holds);
129304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_unlock_irq(&ms->lock);
129404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
129504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	while ((bio = bio_list_pop(&holds)))
129604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		hold_bio(ms, bio);
1297b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow}
1298b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1299b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassowstatic void mirror_postsuspend(struct dm_target *ti)
1300b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow{
1301b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	struct mirror_set *ms = ti->private;
13021f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1303b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
13046b3df0d7a5e85ad2afd3eecc50e2dee59e876ae8Jonathan Brassow	if (log->type->postsuspend && log->type->postsuspend(log))
13051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* FIXME: need better error handling */
1306b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		DMWARN("log postsuspend failed");
13071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
13081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_resume(struct dm_target *ti)
13101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1311b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	struct mirror_set *ms = ti->private;
13121f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1313b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1314b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 0);
13151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (log->type->resume && log->type->resume(log))
13161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* FIXME: need better error handling */
13171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		DMWARN("log resume failed");
13181f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_start_recovery(ms->rh);
13191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
13201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1321af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow/*
1322af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * device_status_char
1323af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * @m: mirror device/leg we want the status of
1324af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *
1325af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * We return one character representing the most severe error
1326af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * we have encountered.
1327af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    A => Alive - No failures
1328af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    D => Dead - A write failure occurred leaving mirror out-of-sync
1329af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    S => Sync - A sychronization failure occurred, mirror out-of-sync
1330af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    R => Read - A read failure occurred, mirror data unaffected
1331af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *
1332af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * Returns: <char>
1333af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow */
1334af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassowstatic char device_status_char(struct mirror *m)
1335af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow{
1336af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow	if (!atomic_read(&(m->error_count)))
1337af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		return 'A';
1338af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
133964b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka	return (test_bit(DM_RAID1_FLUSH_ERROR, &(m->error_type))) ? 'F' :
134064b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka		(test_bit(DM_RAID1_WRITE_ERROR, &(m->error_type))) ? 'D' :
1341af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		(test_bit(DM_RAID1_SYNC_ERROR, &(m->error_type))) ? 'S' :
1342af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		(test_bit(DM_RAID1_READ_ERROR, &(m->error_type))) ? 'R' : 'U';
1343af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow}
1344af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
1345af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
13461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_status(struct dm_target *ti, status_type_t type,
13471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 char *result, unsigned int maxlen)
13481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1349315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow	unsigned int m, sz = 0;
13501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
13511f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1352af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow	char buffer[ms->nr_mirrors + 1];
13531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	switch (type) {
13551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	case STATUSTYPE_INFO:
13561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		DMEMIT("%d ", ms->nr_mirrors);
1357af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		for (m = 0; m < ms->nr_mirrors; m++) {
13581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			DMEMIT("%s ", ms->mirror[m].dev->name);
1359af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow			buffer[m] = device_status_char(&(ms->mirror[m]));
1360af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		}
1361af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		buffer[m] = '\0';
13621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1363af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		DMEMIT("%llu/%llu 1 %s ",
13641f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		      (unsigned long long)log->type->get_sync_count(log),
1365af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		      (unsigned long long)ms->nr_regions, buffer);
1366315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
13671f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		sz += log->type->status(log, type, result+sz, maxlen-sz);
1368315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
13691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		break;
13701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	case STATUSTYPE_TABLE:
13721f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		sz = log->type->status(log, type, result, maxlen);
1373315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
1374e52b8f6dbe18c879ad2b5013f991ec9e46813043Jonathan Brassow		DMEMIT("%d", ms->nr_mirrors);
13751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		for (m = 0; m < ms->nr_mirrors; m++)
1376e52b8f6dbe18c879ad2b5013f991ec9e46813043Jonathan Brassow			DMEMIT(" %s %llu", ms->mirror[m].dev->name,
1377b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow			       (unsigned long long)ms->mirror[m].offset);
1378a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1379a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		if (ms->features & DM_RAID1_HANDLE_ERRORS)
1380a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow			DMEMIT(" 1 handle_errors");
13811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
13821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
13841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
13851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1386af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzerstatic int mirror_iterate_devices(struct dm_target *ti,
1387af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer				  iterate_devices_callout_fn fn, void *data)
1388af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer{
1389af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	struct mirror_set *ms = ti->private;
1390af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	int ret = 0;
1391af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	unsigned i;
1392af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
1393af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	for (i = 0; !ret && i < ms->nr_mirrors; i++)
1394af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer		ret = fn(ti, ms->mirror[i].dev,
13955dea271b6d87bd1d79a59c1d5baac2596a841c37Mike Snitzer			 ms->mirror[i].offset, ti->len, data);
1396af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
1397af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	return ret;
1398af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer}
1399af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
14001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct target_type mirror_target = {
14011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.name	 = "mirror",
1402af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	.version = {1, 12, 0},
14031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.module	 = THIS_MODULE,
14041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.ctr	 = mirror_ctr,
14051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.dtr	 = mirror_dtr,
14061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.map	 = mirror_map,
14071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.end_io	 = mirror_end_io,
1408b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	.presuspend = mirror_presuspend,
14091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.postsuspend = mirror_postsuspend,
14101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.resume	 = mirror_resume,
14111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.status	 = mirror_status,
1412af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	.iterate_devices = mirror_iterate_devices,
14131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds};
14141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int __init dm_mirror_init(void)
14161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
14171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
14181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
141995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	_dm_raid1_read_record_cache = KMEM_CACHE(dm_raid1_read_record, 0);
142095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	if (!_dm_raid1_read_record_cache) {
142195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		DMERR("Can't allocate dm_raid1_read_record cache");
142295f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		r = -ENOMEM;
142395f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		goto bad_cache;
142495f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	}
142595f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
14261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	r = dm_register_target(&mirror_target);
142795f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	if (r < 0) {
14280cd3312434cd1f29bee6bff53bf2790d733ad2a2Alasdair G Kergon		DMERR("Failed to register mirror target");
142995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		goto bad_target;
143095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	}
143195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
143295f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	return 0;
14331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
143495f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockabad_target:
143595f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	kmem_cache_destroy(_dm_raid1_read_record_cache);
143695f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockabad_cache:
14371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return r;
14381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void __exit dm_mirror_exit(void)
14411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
144210d3bd09a3c25df114f74f7f86e1b58d070bef32Mikulas Patocka	dm_unregister_target(&mirror_target);
144395f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	kmem_cache_destroy(_dm_raid1_read_record_cache);
14441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* Module hooks */
14471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_init(dm_mirror_init);
14481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_exit(dm_mirror_exit);
14491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_DESCRIPTION(DM_NAME " mirror target");
14511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_AUTHOR("Joe Thornber");
14521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_LICENSE("GPL");
1453