dm-raid1.c revision 0f398a8403e31c737b429fddc3850093d0bf58d0
11da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
21da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Copyright (C) 2003 Sistina Software Limited.
31f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen * Copyright (C) 2005-2008 Red Hat, Inc. All rights reserved.
41da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
51da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * This file is released under the GPL.
61da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
71da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow#include "dm-bio-record.h"
91da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/init.h>
111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/mempool.h>
121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/module.h>
131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/pagemap.h>
141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/slab.h>
151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/workqueue.h>
161f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen#include <linux/device-mapper.h>
17a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-io.h>
18a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-dirty-log.h>
19a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-kcopyd.h>
201f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen#include <linux/dm-region-hash.h>
211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/* Prefix used by the DM logging macros for this target. */
#define DM_MSG_PREFIX "raid1"

/* Maximum number of regions recovered in parallel. */
#define MAX_RECOVERY 1
#define DM_IO_PAGES 64
#define DM_KCOPYD_PAGES 64

/*
 * Feature bits kept in mirror_set.features.  errors_handled() is non-zero
 * when DM_RAID1_HANDLE_ERRORS is set on the object @p points to.
 */
#define DM_RAID1_HANDLE_ERRORS 0x01
#define errors_handled(p)	((p)->features & DM_RAID1_HANDLE_ERRORS)

/* Wait queue woken by wakeup_all_recovery_waiters(). */
static DECLARE_WAIT_QUEUE_HEAD(_kmirrord_recovery_stopped);
321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/*-----------------------------------------------------------------
 * Mirror set structures.
 *---------------------------------------------------------------*/

/*
 * Kinds of error that can be recorded against a mirror.  The values are
 * used as bit numbers in mirror.error_type (see fail_mirror()).
 */
enum dm_raid1_error {
	DM_RAID1_WRITE_ERROR = 0,
	DM_RAID1_FLUSH_ERROR = 1,
	DM_RAID1_SYNC_ERROR = 2,
	DM_RAID1_READ_ERROR = 3
};
4272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
43e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brownstruct mirror {
44aa5617c55357d86c9082ba1d66fa9795370c9954Jonathan Brassow	struct mirror_set *ms;
45e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	atomic_t error_count;
4639ed7adb17bdec8224bd3fae551bb7222e05f35bAl Viro	unsigned long error_type;
47e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct dm_dev *dev;
48e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	sector_t offset;
49e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown};
50e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
51e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brownstruct mirror_set {
52e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct dm_target *ti;
53e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct list_head list;
541f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen
55a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	uint64_t features;
56e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
5772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spinlock_t lock;	/* protects the lists */
58e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct bio_list reads;
59e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct bio_list writes;
6072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio_list failures;
6104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio_list holds;	/* bios are waiting until suspend */
62e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
631f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region_hash *rh;
641f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_kcopyd_client *kcopyd_client;
6588be163abb5324bab09f5eff9646590eec5314ebMilan Broz	struct dm_io_client *io_client;
6606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	mempool_t *read_record_pool;
6788be163abb5324bab09f5eff9646590eec5314ebMilan Broz
68e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	/* recovery */
69e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	region_t nr_regions;
70e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	int in_sync;
71fc1ff9588a6d56258ff9576a31aa34f17757c666Jonathan Brassow	int log_failure;
72b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_t suspend;
73e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
7472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_t default_mirror;	/* Default mirror */
75e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
766ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	struct workqueue_struct *kmirrord_wq;
776ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	struct work_struct kmirrord_work;
78a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	struct timer_list timer;
79a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	unsigned long timer_pending;
80a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
8172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct work_struct trigger_event;
826ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
831f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned nr_mirrors;
84e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct mirror mirror[0];
85e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown};
86e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
871f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void wakeup_mirrord(void *context)
881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
891f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = context;
901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
916ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	queue_work(ms->kmirrord_wq, &ms->kmirrord_work);
926ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski}
936ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
94a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void delayed_wake_fn(unsigned long data)
95a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka{
96a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	struct mirror_set *ms = (struct mirror_set *) data;
97a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
98a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	clear_bit(0, &ms->timer_pending);
991f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wakeup_mirrord(ms);
100a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka}
101a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
102a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void delayed_wake(struct mirror_set *ms)
103a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka{
104a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	if (test_and_set_bit(0, &ms->timer_pending))
105a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka		return;
106a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
107a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.expires = jiffies + HZ / 5;
108a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.data = (unsigned long) ms;
109a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.function = delayed_wake_fn;
110a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	add_timer(&ms->timer);
111a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka}
112a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
1131f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void wakeup_all_recovery_waiters(void *context)
1141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1151f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wake_up_all(&_kmirrord_recovery_stopped);
1161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1181f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void queue_bio(struct mirror_set *ms, struct bio *bio, int rw)
1191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned long flags;
1211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int should_wake = 0;
1221f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct bio_list *bl;
1231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	bl = (rw == WRITE) ? &ms->writes : &ms->reads;
1251f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	spin_lock_irqsave(&ms->lock, flags);
1261f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	should_wake = !(bl->head);
1271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	bio_list_add(bl, bio);
1281f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	spin_unlock_irqrestore(&ms->lock, flags);
1291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (should_wake)
1311f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		wakeup_mirrord(ms);
1321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1341f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void dispatch_bios(void *context, struct bio_list *bio_list)
1351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1361f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = context;
1371f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct bio *bio;
1381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	while ((bio = bio_list_pop(bio_list)))
1401f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		queue_bio(ms, bio, WRITE);
1411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow#define MIN_READ_RECORDS 20
14406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstruct dm_raid1_read_record {
14506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m;
14606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_bio_details details;
14706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow};
14806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
14995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockastatic struct kmem_cache *_dm_raid1_read_record_cache;
15095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
/*
 * Index of the reference mirror: every mirror should look like this one.
 */
#define DEFAULT_MIRROR 0
1551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
15706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * This is yucky.  We squirrel the mirror struct away inside
15806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * bi_next for read/write buffers.  This is safe since the bh
1591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * doesn't get submitted to the lower levels of block layer.
1601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
16106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic struct mirror *bio_get_m(struct bio *bio)
1621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
16306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return (struct mirror *) bio->bi_next;
1641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
16606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void bio_set_m(struct bio *bio, struct mirror *m)
1671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
16806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio->bi_next = (struct bio *) m;
1691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
17172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic struct mirror *get_default_mirror(struct mirror_set *ms)
17272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
17372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	return &ms->mirror[atomic_read(&ms->default_mirror)];
17472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
17572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
17672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void set_default_mirror(struct mirror *m)
17772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
17872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms = m->ms;
17972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror *m0 = &(ms->mirror[0]);
18072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
18172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&ms->default_mirror, m - m0);
18272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
18372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
18472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow/* fail_mirror
18572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * @m: mirror device to fail
18672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * @error_type: one of the enum's, DM_RAID1_*_ERROR
18772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow *
18872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * If errors are being handled, record the type of
18972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * error encountered for this device.  If this type
19072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * of error has already been recorded, we can return;
19172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * otherwise, we must signal userspace by triggering
19272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * an event.  Additionally, if the device is the
19372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * primary device, we must choose a new primary, but
19472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * only if the mirror is in-sync.
19572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow *
19672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * This function must not block.
19772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow */
19872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void fail_mirror(struct mirror *m, enum dm_raid1_error error_type)
19972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
20072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms = m->ms;
20172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror *new;
20272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
20372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	/*
20472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * error_count is used for nothing more than a
20572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * simple way to tell if a device has encountered
20672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * errors.
20772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 */
20872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_inc(&m->error_count);
20972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
21072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (test_and_set_bit(error_type, &m->error_type))
21172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
21272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
213d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow	if (!errors_handled(ms))
214d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow		return;
215d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow
21672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (m != get_default_mirror(ms))
21772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
21872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
21972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (!ms->in_sync) {
22072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		/*
22172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * Better to issue requests to same failing device
22272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * than to risk returning corrupt data.
22372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 */
22472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMERR("Primary mirror (%s) failed while out-of-sync: "
22572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		      "Reads may fail.", m->dev->name);
22672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
22772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	}
22872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
22972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	for (new = ms->mirror; new < ms->mirror + ms->nr_mirrors; new++)
23072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (!atomic_read(&new->error_count)) {
23172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			set_default_mirror(new);
23272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			break;
23372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		}
23472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
23572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (unlikely(new == ms->mirror + ms->nr_mirrors))
23672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMWARN("All sides of mirror have failed.");
23772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
23872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowout:
23972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	schedule_work(&ms->trigger_event);
24072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
24172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
242c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patockastatic int mirror_flush(struct dm_target *ti)
243c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka{
244c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct mirror_set *ms = ti->private;
245c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	unsigned long error_bits;
246c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
247c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	unsigned int i;
248c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct dm_io_region io[ms->nr_mirrors];
249c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct mirror *m;
250c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct dm_io_request io_req = {
251c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.bi_rw = WRITE_BARRIER,
252c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.mem.type = DM_IO_KMEM,
253c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.mem.ptr.bvec = NULL,
254c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.client = ms->io_client,
255c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	};
256c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
257c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	for (i = 0, m = ms->mirror; i < ms->nr_mirrors; i++, m++) {
258c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].bdev = m->dev->bdev;
259c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].sector = 0;
260c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].count = 0;
261c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	}
262c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
263c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	error_bits = -1;
264c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	dm_io(&io_req, ms->nr_mirrors, io, &error_bits);
265c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	if (unlikely(error_bits != 0)) {
266c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		for (i = 0; i < ms->nr_mirrors; i++)
267c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka			if (test_bit(i, &error_bits))
268c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka				fail_mirror(ms->mirror + i,
26964b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka					    DM_RAID1_FLUSH_ERROR);
270c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		return -EIO;
271c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	}
272c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
273c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	return 0;
274c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka}
275c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
2761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
2771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Recovery.
2781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
2791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * When a mirror is first activated we may find that some regions
2801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * are in the no-sync state.  We have to recover these by
2811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recopying from the default mirror to all the others.
2821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
2834cdc1d1fa5c5ac14dc21be19832f02fd0b83867eAlasdair G Kergonstatic void recovery_complete(int read_err, unsigned long write_err,
2841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			      void *context)
2851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
2861f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region *reg = context;
2871f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = dm_rh_region_context(reg);
2888f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	int m, bit = 0;
2891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
2908f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	if (read_err) {
291f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow		/* Read error means the failure of default mirror. */
292f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow		DMERR_LIMIT("Unable to read primary mirror during recovery");
2938f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		fail_mirror(get_default_mirror(ms), DM_RAID1_SYNC_ERROR);
2948f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	}
295f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
2968f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	if (write_err) {
2974cdc1d1fa5c5ac14dc21be19832f02fd0b83867eAlasdair G Kergon		DMERR_LIMIT("Write error during recovery (error = 0x%lx)",
298f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow			    write_err);
2998f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		/*
3008f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 * Bits correspond to devices (excluding default mirror).
3018f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 * The default mirror cannot change during recovery.
3028f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 */
3038f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		for (m = 0; m < ms->nr_mirrors; m++) {
3048f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			if (&ms->mirror[m] == get_default_mirror(ms))
3058f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow				continue;
3068f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			if (test_bit(bit, &write_err))
3078f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow				fail_mirror(ms->mirror + m,
3088f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow					    DM_RAID1_SYNC_ERROR);
3098f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			bit++;
3108f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		}
3118f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	}
312f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
3131f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_recovery_end(reg, !(read_err || write_err));
3141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3161f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic int recover(struct mirror_set *ms, struct dm_region *reg)
3171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
3181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
3191f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned i;
320eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	struct dm_io_region from, to[DM_KCOPYD_MAX_REGIONS], *dest;
3211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
3221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned long flags = 0;
3231f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	region_t key = dm_rh_get_region_key(reg);
3241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	sector_t region_size = dm_rh_get_region_size(ms->rh);
3251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* fill in the source */
32772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	m = get_default_mirror(ms);
3281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	from.bdev = m->dev->bdev;
3291f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	from.sector = m->offset + dm_rh_region_to_sector(ms->rh, key);
3301f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (key == (ms->nr_regions - 1)) {
3311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
3321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * The final region may be smaller than
3331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * region_size.
3341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
3351f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		from.count = ms->ti->len & (region_size - 1);
3361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (!from.count)
3371f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			from.count = region_size;
3381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	} else
3391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		from.count = region_size;
3401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* fill in the destinations */
3421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	for (i = 0, dest = to; i < ms->nr_mirrors; i++) {
34372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (&ms->mirror[i] == get_default_mirror(ms))
3441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			continue;
3451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		m = ms->mirror + i;
3471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest->bdev = m->dev->bdev;
3481f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		dest->sector = m->offset + dm_rh_region_to_sector(ms->rh, key);
3491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest->count = from.count;
3501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest++;
3511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* hand to kcopyd */
354f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow	if (!errors_handled(ms))
355f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow		set_bit(DM_KCOPYD_IGNORE_ERROR, &flags);
356f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow
357eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	r = dm_kcopyd_copy(ms->kcopyd_client, &from, ms->nr_mirrors - 1, to,
358eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen			   flags, recovery_complete, reg);
3591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return r;
3611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_recovery(struct mirror_set *ms)
3641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
3651f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region *reg;
3661f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
3671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
3681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Start quiescing some regions.
3711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3721f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_recovery_prepare(ms->rh);
3731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Copy any already quiesced regions.
3761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3771f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	while ((reg = dm_rh_recovery_start(ms->rh))) {
3781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		r = recover(ms, reg);
3791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (r)
3801f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			dm_rh_recovery_end(reg, 0);
3811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Update the in sync flag.
3851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms->in_sync &&
3871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	    (log->type->get_sync_count(log) == ms->nr_regions)) {
3881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* the sync is complete */
3891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dm_table_event(ms->ti->table);
3901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		ms->in_sync = 1;
3911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
3951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Reads
3961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
3971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror *choose_mirror(struct mirror_set *ms, sector_t sector)
3981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
39906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m = get_default_mirror(ms);
40006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
40106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	do {
40206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (likely(!atomic_read(&m->error_count)))
40306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return m;
40406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
40506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (m-- == ms->mirror)
40606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			m += ms->nr_mirrors;
40706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	} while (m != get_default_mirror(ms));
40806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
40906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return NULL;
41006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
41106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic int default_ok(struct mirror *m)
41306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
41406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *default_mirror = get_default_mirror(m->ms);
41506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return !atomic_read(&default_mirror->error_count);
41706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
41806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic int mirror_available(struct mirror_set *ms, struct bio *bio)
42006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
4211f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
4221f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	region_t region = dm_rh_bio_to_region(ms->rh, bio);
42306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
4241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (log->type->in_sync(log, region, 0))
42506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return choose_mirror(ms,  bio->bi_sector) ? 1 : 0;
42606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return 0;
4281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
4291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
4301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
4311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * remap a buffer to a particular mirror.
4321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
43306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic sector_t map_sector(struct mirror *m, struct bio *bio)
43406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
4354184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka	if (unlikely(!bio->bi_size))
4364184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		return 0;
43706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return m->offset + (bio->bi_sector - m->ms->ti->begin);
43806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
43906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
44006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void map_bio(struct mirror *m, struct bio *bio)
4411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
4421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio->bi_bdev = m->dev->bdev;
44306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio->bi_sector = map_sector(m, bio);
44406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
44506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
44622a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagenstatic void map_region(struct dm_io_region *io, struct mirror *m,
44706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		       struct bio *bio)
44806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
44906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->bdev = m->dev->bdev;
45006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->sector = map_sector(m, bio);
45106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->count = bio->bi_size >> 9;
45206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
45306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
45404788507686d184d8166918b70ef52311bc36dcbMikulas Patockastatic void hold_bio(struct mirror_set *ms, struct bio *bio)
45504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka{
45604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
45704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * If device is suspended, complete the bio.
45804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
45904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	if (atomic_read(&ms->suspend)) {
46004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		if (dm_noflush_suspending(ms->ti))
46104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka			bio_endio(bio, DM_ENDIO_REQUEUE);
46204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		else
46304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka			bio_endio(bio, -EIO);
46404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		return;
46504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	}
46604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
46704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
46804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Hold bio until the suspend is complete.
46904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
47004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_lock_irq(&ms->lock);
47104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	bio_list_add(&ms->holds, bio);
47204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_unlock_irq(&ms->lock);
47304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka}
47404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
47506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow/*-----------------------------------------------------------------
47606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * Reads
47706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow *---------------------------------------------------------------*/
47806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void read_callback(unsigned long error, void *context)
47906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
48006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct bio *bio = context;
48106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m;
48206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
48306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	m = bio_get_m(bio);
48406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, NULL);
48506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
48606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(!error)) {
48706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		bio_endio(bio, 0);
48806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return;
48906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
49006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
49106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	fail_mirror(m, DM_RAID1_READ_ERROR);
49206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
49306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(default_ok(m)) || mirror_available(m->ms, bio)) {
49406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMWARN_LIMIT("Read failure on mirror device %s.  "
49506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			     "Trying alternative device.",
49606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			     m->dev->name);
49706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		queue_bio(m->ms, bio, bio_rw(bio));
49806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return;
49906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
50006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	DMERR_LIMIT("Read failure on mirror device %s.  Failing I/O.",
50206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		    m->dev->name);
50306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_endio(bio, -EIO);
50406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
50506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow/* Asynchronous read. */
50706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void read_async_bio(struct mirror *m, struct bio *bio)
50806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
50922a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagen	struct dm_io_region io;
51006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_io_request io_req = {
51106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.bi_rw = READ,
51206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.mem.type = DM_IO_BVEC,
51306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.mem.ptr.bvec = bio->bi_io_vec + bio->bi_idx,
51406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.notify.fn = read_callback,
51506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.notify.context = bio,
51606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.client = m->ms->io_client,
51706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	};
51806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
51906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	map_region(&io, m, bio);
52006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, m);
5211f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	BUG_ON(dm_io(&io_req, 1, &io, NULL));
5221f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen}
5231f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen
5241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic inline int region_in_sync(struct mirror_set *ms, region_t region,
5251f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				 int may_block)
5261f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen{
5271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	int state = dm_rh_get_state(ms->rh, region, may_block);
5281f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	return state == DM_RH_CLEAN || state == DM_RH_DIRTY;
5291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
5301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_reads(struct mirror_set *ms, struct bio_list *reads)
5321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
5331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	region_t region;
5341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio;
5351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
5361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(reads))) {
5381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		region = dm_rh_bio_to_region(ms->rh, bio);
53906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		m = get_default_mirror(ms);
5401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
5421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * We can only read balance if the region is in sync.
5431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
5441f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		if (likely(region_in_sync(ms, region, 1)))
5451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			m = choose_mirror(ms, bio->bi_sector);
54606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		else if (m && atomic_read(&m->error_count))
54706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			m = NULL;
5481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
54906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (likely(m))
55006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			read_async_bio(m, bio);
55106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		else
55206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			bio_endio(bio, -EIO);
5531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
5541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
5551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/*-----------------------------------------------------------------
 * Writes.
 *
 * We do different things with the write io depending on the
 * state of the region that it's in:
 *
 * SYNC: 	increment pending, use dm_io to write to *all* mirrors
 * RECOVERING:	delay the io until recovery completes
 * NOSYNC:	increment pending, just write to the default mirror
 *---------------------------------------------------------------*/
56672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
56772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
5681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void write_callback(unsigned long error, void *context)
5691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
57072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned i, ret = 0;
5711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio = (struct bio *) context;
5721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms;
57372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	int uptodate = 0;
57472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	int should_wake = 0;
57572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned long flags;
5761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
57706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	ms = bio_get_m(bio)->ms;
57806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, NULL);
5791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
5811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * NOTE: We don't decrement the pending count here,
5821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * instead it is done by the targets endio function.
5831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * This way we handle both writes to SYNC and NOSYNC
5841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * regions with the same code.
5851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
58672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (likely(!error))
58772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
5881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
58972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	for (i = 0; i < ms->nr_mirrors; i++)
59072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (test_bit(i, &error))
59172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			fail_mirror(ms->mirror + i, DM_RAID1_WRITE_ERROR);
59272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		else
59372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			uptodate = 1;
59472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
59572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (unlikely(!uptodate)) {
59672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMERR("All replicated volumes dead, failing I/O");
59772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		/* None of the writes succeeded, fail the I/O. */
59872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		ret = -EIO;
59972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	} else if (errors_handled(ms)) {
6001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
60172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * Need to raise event.  Since raising
60272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * events can block, we need to do it in
60372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * the main thread.
6041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
60572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		spin_lock_irqsave(&ms->lock, flags);
60672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (!ms->failures.head)
60772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			should_wake = 1;
60872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		bio_list_add(&ms->failures, bio);
60972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		spin_unlock_irqrestore(&ms->lock, flags);
61072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (should_wake)
6111f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			wakeup_mirrord(ms);
61272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
6131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
61472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowout:
61572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	bio_endio(bio, ret);
6161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
6171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_write(struct mirror_set *ms, struct bio *bio)
6191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
6201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned int i;
62122a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagen	struct dm_io_region io[ms->nr_mirrors], *dest = io;
6221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
62388be163abb5324bab09f5eff9646590eec5314ebMilan Broz	struct dm_io_request io_req = {
6244184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		.bi_rw = WRITE | (bio->bi_rw & WRITE_BARRIER),
62588be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.mem.type = DM_IO_BVEC,
62688be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.mem.ptr.bvec = bio->bi_io_vec + bio->bi_idx,
62788be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.notify.fn = write_callback,
62888be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.notify.context = bio,
62988be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.client = ms->io_client,
63088be163abb5324bab09f5eff9646590eec5314ebMilan Broz	};
6311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
63206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	for (i = 0, m = ms->mirror; i < ms->nr_mirrors; i++, m++)
63306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_region(dest++, m, bio);
6341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
63506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	/*
63606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * Use default mirror because we only need it to retrieve the reference
63706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * to the mirror set in write_callback().
63806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 */
63906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, get_default_mirror(ms));
64088be163abb5324bab09f5eff9646590eec5314ebMilan Broz
6411f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	BUG_ON(dm_io(&io_req, ms->nr_mirrors, io, NULL));
6421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
6431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_writes(struct mirror_set *ms, struct bio_list *writes)
6451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
6461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int state;
6471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio;
6481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio_list sync, nosync, recover, *this_list = NULL;
6497513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	struct bio_list requeue;
6507513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
6517513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	region_t region;
6521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!writes->head)
6541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return;
6551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
6571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Classify each write.
6581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
6591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&sync);
6601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&nosync);
6611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&recover);
6627513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	bio_list_init(&requeue);
6631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(writes))) {
6654184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		if (unlikely(bio_empty_barrier(bio))) {
6664184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			bio_list_add(&sync, bio);
6674184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			continue;
6684184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		}
6694184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka
6707513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		region = dm_rh_bio_to_region(ms->rh, bio);
6717513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
6727513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		if (log->type->is_remote_recovering &&
6737513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		    log->type->is_remote_recovering(log, region)) {
6747513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow			bio_list_add(&requeue, bio);
6757513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow			continue;
6767513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		}
6777513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
6787513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		state = dm_rh_get_state(ms->rh, region, 1);
6791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		switch (state) {
6801f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_CLEAN:
6811f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_DIRTY:
6821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &sync;
6831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6851f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_NOSYNC:
6861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &nosync;
6871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6891f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_RECOVERING:
6901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &recover;
6911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		}
6931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		bio_list_add(this_list, bio);
6951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
6961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
6987513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 * Add bios that are delayed due to remote recovery
6997513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 * back on to the write queue
7007513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 */
7017513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	if (unlikely(requeue.head)) {
7027513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		spin_lock_irq(&ms->lock);
7037513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		bio_list_merge(&ms->writes, &requeue);
7047513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		spin_unlock_irq(&ms->lock);
70569885683d22d8c05910fd808c01fdce1322739b4Mikulas Patocka		delayed_wake(ms);
7067513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	}
7077513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
7087513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	/*
7091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Increment the pending counts for any regions that will
7101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * be written to (writes to recover regions are going to
7111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * be delayed).
7121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
7131f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_inc_pending(ms->rh, &sync);
7141f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_inc_pending(ms->rh, &nosync);
715d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow
716d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	/*
717d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * If the flush fails on a previous call and succeeds here,
718d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * we must not reset the log_failure variable.  We need
719d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * userspace interaction to do that.
720d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 */
721d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	ms->log_failure = dm_rh_flush(ms->rh) ? 1 : ms->log_failure;
7221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
7241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Dispatch io.
7251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
726b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	if (unlikely(ms->log_failure)) {
727b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		spin_lock_irq(&ms->lock);
728b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		bio_list_merge(&ms->failures, &sync);
729b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		spin_unlock_irq(&ms->lock);
7301f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		wakeup_mirrord(ms);
731b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	} else
732fc1ff9588a6d56258ff9576a31aa34f17757c666Jonathan Brassow		while ((bio = bio_list_pop(&sync)))
733b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow			do_write(ms, bio);
7341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(&recover)))
7361f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		dm_rh_delay(ms->rh, bio);
7371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(&nosync))) {
73906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_bio(get_default_mirror(ms), bio);
7401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		generic_make_request(bio);
7411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
7421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
7431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
74472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void do_failures(struct mirror_set *ms, struct bio_list *failures)
74572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
74672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio *bio;
74772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
7480f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	if (likely(!failures->head))
74972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
75072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
751b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
752b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * If the log has failed, unattempted writes are being
7530f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	 * put on the holds list.  We can't issue those writes
754b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * until a log has been marked, so we must store them.
755b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 *
756b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * If a 'noflush' suspend is in progress, we can requeue
757b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * the I/O's to the core.  This give userspace a chance
758b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * to reconfigure the mirror, at which point the core
759b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * will reissue the writes.  If the 'noflush' flag is
760b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * not set, we have no choice but to return errors.
761b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 *
762b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * Some writes on the failures list may have been
763b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * submitted before the log failure and represent a
764b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * failure to write to one of the devices.  It is ok
765b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * for us to treat them the same and requeue them
766b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * as well.
767b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
768b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
7690f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	while ((bio = bio_list_pop(failures))) {
7700f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka		if (ms->log_failure)
7710f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka			hold_bio(ms, bio);
7720f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka		else {
7730f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka			ms->in_sync = 0;
7740f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka			dm_rh_mark_nosync(ms->rh, bio, bio->bi_size, 0);
7750f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka		}
776b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	}
77772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
77872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
77972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void trigger_event(struct work_struct *work)
78072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
78172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms =
78272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		container_of(work, struct mirror_set, trigger_event);
78372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
78472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	dm_table_event(ms->ti->table);
78572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
78672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
7871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
7881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * kmirrord
7891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
790a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void do_mirror(struct work_struct *work)
7911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
7921f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = container_of(work, struct mirror_set,
7931f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     kmirrord_work);
79472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio_list reads, writes, failures;
79572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned long flags;
7961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
79772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spin_lock_irqsave(&ms->lock, flags);
7981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	reads = ms->reads;
7991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	writes = ms->writes;
80072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	failures = ms->failures;
8011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&ms->reads);
8021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&ms->writes);
80372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	bio_list_init(&ms->failures);
80472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spin_unlock_irqrestore(&ms->lock, flags);
8051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8061f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_update_states(ms->rh, errors_handled(ms));
8071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_recovery(ms);
8081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_reads(ms, &reads);
8091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_writes(ms, &writes);
81072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	do_failures(ms, &failures);
8117ff14a36159d947872870e7a3e9dcaebc46b23ebMikulas Patocka
8127ff14a36159d947872870e7a3e9dcaebc46b23ebMikulas Patocka	dm_table_unplug_all(ms->ti->table);
8131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
8141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
8161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Target functions
8171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
8181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror_set *alloc_context(unsigned int nr_mirrors,
8191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds					uint32_t region_size,
8201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds					struct dm_target *ti,
821416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen					struct dm_dirty_log *dl)
8221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	size_t len;
8241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = NULL;
8251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	len = sizeof(*ms) + (sizeof(ms->mirror[0]) * nr_mirrors);
8271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
828dd00cc486ab1c17049a535413d1751ef3482141cYoann Padioleau	ms = kzalloc(len, GFP_KERNEL);
8291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms) {
83072d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Cannot allocate mirror context";
8311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
8321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
8331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	spin_lock_init(&ms->lock);
8351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->ti = ti;
8371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->nr_mirrors = nr_mirrors;
8381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->nr_regions = dm_sector_div_up(ti->len, region_size);
8391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->in_sync = 0;
840b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	ms->log_failure = 0;
841b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 0);
84272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&ms->default_mirror, DEFAULT_MIRROR);
8431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
84495f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	ms->read_record_pool = mempool_create_slab_pool(MIN_READ_RECORDS,
84595f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka						_dm_raid1_read_record_cache);
84695f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
84706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (!ms->read_record_pool) {
84806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		ti->error = "Error creating mirror read_record_pool";
84906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		kfree(ms);
85006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return NULL;
85106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
85206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
85388be163abb5324bab09f5eff9646590eec5314ebMilan Broz	ms->io_client = dm_io_client_create(DM_IO_PAGES);
85488be163abb5324bab09f5eff9646590eec5314ebMilan Broz	if (IS_ERR(ms->io_client)) {
85588be163abb5324bab09f5eff9646590eec5314ebMilan Broz		ti->error = "Error creating dm_io client";
85606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_destroy(ms->read_record_pool);
85788be163abb5324bab09f5eff9646590eec5314ebMilan Broz		kfree(ms);
85888be163abb5324bab09f5eff9646590eec5314ebMilan Broz 		return NULL;
85988be163abb5324bab09f5eff9646590eec5314ebMilan Broz	}
86088be163abb5324bab09f5eff9646590eec5314ebMilan Broz
8611f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	ms->rh = dm_region_hash_create(ms, dispatch_bios, wakeup_mirrord,
8621f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       wakeup_all_recovery_waiters,
8631f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       ms->ti->begin, MAX_RECOVERY,
8641f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       dl, region_size, ms->nr_regions);
8651f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (IS_ERR(ms->rh)) {
86672d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Error creating dirty region hash";
867a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		dm_io_client_destroy(ms->io_client);
86806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_destroy(ms->read_record_pool);
8691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		kfree(ms);
8701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
8711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
8721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return ms;
8741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
8751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void free_context(struct mirror_set *ms, struct dm_target *ti,
8771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 unsigned int m)
8781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while (m--)
8801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dm_put_device(ti, ms->mirror[m].dev);
8811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
88288be163abb5324bab09f5eff9646590eec5314ebMilan Broz	dm_io_client_destroy(ms->io_client);
8831f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_region_hash_destroy(ms->rh);
88406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	mempool_destroy(ms->read_record_pool);
8851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	kfree(ms);
8861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
8871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int get_mirror(struct mirror_set *ms, struct dm_target *ti,
8891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		      unsigned int mirror, char **argv)
8901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8914ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton	unsigned long long offset;
8921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8934ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton	if (sscanf(argv[1], "%llu", &offset) != 1) {
89472d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid offset";
8951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
8961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
8971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (dm_get_device(ti, argv[0], offset, ti->len,
8991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			  dm_table_get_mode(ti->table),
9001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			  &ms->mirror[mirror].dev)) {
90172d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Device lookup failure";
9021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -ENXIO;
9031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
905aa5617c55357d86c9082ba1d66fa9795370c9954Jonathan Brassow	ms->mirror[mirror].ms = ms;
90672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&(ms->mirror[mirror].error_count), 0);
90772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	ms->mirror[mirror].error_type = 0;
9081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->mirror[mirror].offset = offset;
9091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
9111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
9141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Create dirty log: log_type #log_params <log_params>
9151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
916416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagenstatic struct dm_dirty_log *create_dirty_log(struct dm_target *ti,
9171f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     unsigned argc, char **argv,
9181f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     unsigned *args_used)
9191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9201f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned param_count;
921416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen	struct dm_dirty_log *dl;
9221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (argc < 2) {
92472d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Insufficient mirror log arguments";
9251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (sscanf(argv[1], "%u", &param_count) != 1) {
92972d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid mirror log argument count";
9301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	*args_used = 2 + param_count;
9341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (argc < *args_used) {
93672d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Insufficient mirror log arguments";
9371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
940c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	dl = dm_dirty_log_create(argv[0], ti, mirror_flush, param_count,
941c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka				 argv + 2);
9421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!dl) {
94372d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Error creating mirror dirty log";
9441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return dl;
9481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
950a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassowstatic int parse_features(struct mirror_set *ms, unsigned argc, char **argv,
951a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow			  unsigned *args_used)
952a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow{
953a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	unsigned num_features;
954a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	struct dm_target *ti = ms->ti;
955a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
956a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	*args_used = 0;
957a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
958a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (!argc)
959a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return 0;
960a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
961a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (sscanf(argv[0], "%u", &num_features) != 1) {
962a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Invalid number of features";
963a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
964a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
965a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
966a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argc--;
967a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argv++;
968a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	(*args_used)++;
969a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
970a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (num_features > argc) {
971a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Not enough arguments to support feature count";
972a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
973a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
974a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
975a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (!strcmp("handle_errors", argv[0]))
976a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ms->features |= DM_RAID1_HANDLE_ERRORS;
977a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	else {
978a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Unrecognised feature requested";
979a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
980a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
981a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
982a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	(*args_used)++;
983a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
984a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	return 0;
985a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow}
986a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
9871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
9881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Construct a mirror mapping:
9891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
9901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type #log_params <log_params>
9911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #mirrors [mirror_path offset]{2,}
992a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow * [#features <features>]
9931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
9941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type is "core" or "disk"
9951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #log_params is between 1 and 3
996a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow *
997a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow * If present, features must be "handle_errors".
9981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
9991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_ctr(struct dm_target *ti, unsigned int argc, char **argv)
10001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
10011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
10021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned int nr_mirrors, m, args_used;
10031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms;
1004416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen	struct dm_dirty_log *dl;
10051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	dl = create_dirty_log(ti, argc, argv, &args_used);
10071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!dl)
10081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argv += args_used;
10111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argc -= args_used;
10121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!argc || sscanf(argv[0], "%u", &nr_mirrors) != 1 ||
1014eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	    nr_mirrors < 2 || nr_mirrors > DM_KCOPYD_MAX_REGIONS + 1) {
101572d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid number of mirrors";
1016416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argv++, argc--;
10211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1022a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (argc < nr_mirrors * 2) {
1023a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Too few mirror arguments";
1024416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms = alloc_context(nr_mirrors, dl->type->get_region_size(dl), ti, dl);
10291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms) {
1030416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -ENOMEM;
10321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* Get the mirror parameter sets */
10351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	for (m = 0; m < nr_mirrors; m++) {
10361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		r = get_mirror(ms, ti, m, argv);
10371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (r) {
10381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			free_context(ms, ti, m);
10391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			return r;
10401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		}
10411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		argv += 2;
10421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		argc -= 2;
10431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ti->private = ms;
10461f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	ti->split_io = dm_rh_get_region_size(ms->rh);
10474184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka	ti->num_flush_requests = 1;
10481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10496ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	ms->kmirrord_wq = create_singlethread_workqueue("kmirrord");
10506ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	if (!ms->kmirrord_wq) {
10516ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski		DMERR("couldn't start kmirrord");
1052a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		r = -ENOMEM;
1053a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_free_context;
10546ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	}
10556ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	INIT_WORK(&ms->kmirrord_work, do_mirror);
1056a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	init_timer(&ms->timer);
1057a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer_pending = 0;
105872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	INIT_WORK(&ms->trigger_event, trigger_event);
10596ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
1060a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	r = parse_features(ms, argc, argv, &args_used);
1061a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	if (r)
1062a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1063a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1064a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argv += args_used;
1065a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argc -= args_used;
1066a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1067f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	/*
1068f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * Any read-balancing addition depends on the
1069f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * DM_RAID1_HANDLE_ERRORS flag being present.
1070f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * This is because the decision to balance depends
1071f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * on the sync state of a region.  If the above
1072f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * flag is not present, we ignore errors; and
1073f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * the sync state may be inaccurate.
1074f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 */
1075f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
1076a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (argc) {
1077a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Too many mirror arguments";
1078a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		r = -EINVAL;
1079a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1080a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1081a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
10821f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	r = dm_kcopyd_client_create(DM_KCOPYD_PAGES, &ms->kcopyd_client);
1083a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	if (r)
1084a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
10851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10861f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wakeup_mirrord(ms);
10871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
1088a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov
1089a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhoverr_destroy_wq:
1090a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	destroy_workqueue(ms->kmirrord_wq);
1091a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhoverr_free_context:
1092a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	free_context(ms, ti, ms->nr_mirrors);
1093a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	return r;
10941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
10951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_dtr(struct dm_target *ti)
10971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
10981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
10991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1100a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	del_timer_sync(&ms->timer);
11016ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	flush_workqueue(ms->kmirrord_wq);
110218776c7316545482a02bfaa2629a2aa1afc48357Mikulas Patocka	flush_scheduled_work();
1103eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	dm_kcopyd_client_destroy(ms->kcopyd_client);
11046ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	destroy_workqueue(ms->kmirrord_wq);
11051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	free_context(ms, ti, ms->nr_mirrors);
11061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
11091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Mirror mapping function
11101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
11111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_map(struct dm_target *ti, struct bio *bio,
11121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		      union map_info *map_context)
11131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r, rw = bio_rw(bio);
11151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
11161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = ti->private;
111706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_raid1_read_record *read_record = NULL;
11181f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
11191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (rw == WRITE) {
112106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		/* Save region for mirror_end_io() handler */
11221f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		map_context->ll = dm_rh_bio_to_region(ms->rh, bio);
11231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		queue_bio(ms, bio, rw);
1124d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda		return DM_MAPIO_SUBMITTED;
11251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
11261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	r = log->type->in_sync(log, dm_rh_bio_to_region(ms->rh, bio), 0);
11281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (r < 0 && r != -EWOULDBLOCK)
11291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return r;
11301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
113206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * If region is not in-sync queue the bio.
11331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
113406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (!r || (r == -EWOULDBLOCK)) {
113506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (rw == READA)
113606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return -EWOULDBLOCK;
11371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		queue_bio(ms, bio, rw);
1139d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda		return DM_MAPIO_SUBMITTED;
11401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
11411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
114206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	/*
114306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * The region is in-sync and we can perform reads directly.
114406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * Store enough information so we can retry if it fails.
114506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 */
11461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	m = choose_mirror(ms, bio->bi_sector);
114706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (unlikely(!m))
11481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EIO;
11491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
115006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	read_record = mempool_alloc(ms->read_record_pool, GFP_NOIO);
115106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(read_record)) {
115206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		dm_bio_record(&read_record->details, bio);
115306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_context->ptr = read_record;
115406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		read_record->m = m;
115506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
115606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
115706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	map_bio(m, bio);
115806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
1159d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda	return DM_MAPIO_REMAPPED;
11601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_end_io(struct dm_target *ti, struct bio *bio,
11631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 int error, union map_info *map_context)
11641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int rw = bio_rw(bio);
11661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
116706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m = NULL;
116806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_bio_details *bd = NULL;
116906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_raid1_read_record *read_record = map_context->ptr;
11701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
11721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * We need to dec pending if this was a write.
11731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
117406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (rw == WRITE) {
11754184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		if (likely(!bio_empty_barrier(bio)))
11764184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			dm_rh_dec(ms->rh, map_context->ll);
117706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return error;
117806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
11791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
118006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (error == -EOPNOTSUPP)
118106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		goto out;
118206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
11831f98a13f623e0ef666690a18c1250335fc6d7ef1Jens Axboe	if ((error == -EWOULDBLOCK) && bio_rw_flagged(bio, BIO_RW_AHEAD))
118406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		goto out;
118506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
118606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (unlikely(error)) {
118706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (!read_record) {
118806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			/*
118906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * There wasn't enough memory to record necessary
119006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * information for a retry or there was no other
119106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * mirror in-sync.
119206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 */
1193e03f1a842287480aa03732612148c0d333baca61Adrian Bunk			DMERR_LIMIT("Mirror read failed.");
119406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return -EIO;
119506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		}
1196e03f1a842287480aa03732612148c0d333baca61Adrian Bunk
1197e03f1a842287480aa03732612148c0d333baca61Adrian Bunk		m = read_record->m;
1198e03f1a842287480aa03732612148c0d333baca61Adrian Bunk
119906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMERR("Mirror read failed from %s. Trying alternative device.",
120006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		      m->dev->name);
120106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
120206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		fail_mirror(m, DM_RAID1_READ_ERROR);
120306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
120406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		/*
120506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 * A failed read is requeued for another attempt using an intact
120606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 * mirror.
120706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 */
120806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (default_ok(m) || mirror_available(ms, bio)) {
120906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			bd = &read_record->details;
121006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
121106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			dm_bio_restore(bd, bio);
121206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			mempool_free(read_record, ms->read_record_pool);
121306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			map_context->ptr = NULL;
121406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			queue_bio(ms, bio, rw);
121506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return 1;
121606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		}
121706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMERR("All replicated volumes dead, failing I/O");
121806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
121906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
122006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowout:
122106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (read_record) {
122206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_free(read_record, ms->read_record_pool);
122306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_context->ptr = NULL;
122406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
122506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
122606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return error;
12271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
12281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1229b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassowstatic void mirror_presuspend(struct dm_target *ti)
12301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
12311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
12321f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
12331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
123404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio_list holds;
123504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio *bio;
123604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
1237b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 1);
1238b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1239b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
1240b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * We must finish up all the work that we've
1241b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * generated (i.e. recovery work).
1242b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
12431f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_stop_recovery(ms->rh);
124433184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow
124533184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow	wait_event(_kmirrord_recovery_stopped,
12461f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		   !dm_rh_recovery_in_flight(ms->rh));
124733184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow
1248b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	if (log->type->presuspend && log->type->presuspend(log))
1249b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		/* FIXME: need better error handling */
1250b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		DMWARN("log presuspend failed");
1251b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1252b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
1253b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * Now that recovery is complete/stopped and the
1254b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * delayed bios are queued, we need to wait for
1255b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * the worker thread to complete.  This way,
1256b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * we know that all of our I/O has been pushed.
1257b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
1258b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	flush_workqueue(ms->kmirrord_wq);
125904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
126004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
126104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Now set ms->suspend is set and the workqueue flushed, no more
126204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * entries can be added to ms->hold list, so process it.
126304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 *
126404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Bios can still arrive concurrently with or after this
126504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * presuspend function, but they cannot join the hold list
126604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * because ms->suspend is set.
126704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
126804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_lock_irq(&ms->lock);
126904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	holds = ms->holds;
127004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	bio_list_init(&ms->holds);
127104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_unlock_irq(&ms->lock);
127204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
127304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	while ((bio = bio_list_pop(&holds)))
127404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		hold_bio(ms, bio);
1275b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow}
1276b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1277b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassowstatic void mirror_postsuspend(struct dm_target *ti)
1278b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow{
1279b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	struct mirror_set *ms = ti->private;
12801f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1281b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
12826b3df0d7a5e85ad2afd3eecc50e2dee59e876ae8Jonathan Brassow	if (log->type->postsuspend && log->type->postsuspend(log))
12831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* FIXME: need better error handling */
1284b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		DMWARN("log postsuspend failed");
12851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
12861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
12871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_resume(struct dm_target *ti)
12881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1289b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	struct mirror_set *ms = ti->private;
12901f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1291b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1292b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 0);
12931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (log->type->resume && log->type->resume(log))
12941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* FIXME: need better error handling */
12951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		DMWARN("log resume failed");
12961f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_start_recovery(ms->rh);
12971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
12981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1299af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow/*
1300af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * device_status_char
1301af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * @m: mirror device/leg we want the status of
1302af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *
1303af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * We return one character representing the most severe error
1304af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * we have encountered.
1305af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    A => Alive - No failures
1306af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    D => Dead - A write failure occurred leaving mirror out-of-sync
1307af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    S => Sync - A sychronization failure occurred, mirror out-of-sync
1308af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    R => Read - A read failure occurred, mirror data unaffected
1309af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *
1310af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * Returns: <char>
1311af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow */
1312af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassowstatic char device_status_char(struct mirror *m)
1313af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow{
1314af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow	if (!atomic_read(&(m->error_count)))
1315af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		return 'A';
1316af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
131764b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka	return (test_bit(DM_RAID1_FLUSH_ERROR, &(m->error_type))) ? 'F' :
131864b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka		(test_bit(DM_RAID1_WRITE_ERROR, &(m->error_type))) ? 'D' :
1319af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		(test_bit(DM_RAID1_SYNC_ERROR, &(m->error_type))) ? 'S' :
1320af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		(test_bit(DM_RAID1_READ_ERROR, &(m->error_type))) ? 'R' : 'U';
1321af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow}
1322af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
1323af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
13241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_status(struct dm_target *ti, status_type_t type,
13251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 char *result, unsigned int maxlen)
13261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1327315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow	unsigned int m, sz = 0;
13281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
13291f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1330af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow	char buffer[ms->nr_mirrors + 1];
13311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	switch (type) {
13331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	case STATUSTYPE_INFO:
13341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		DMEMIT("%d ", ms->nr_mirrors);
1335af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		for (m = 0; m < ms->nr_mirrors; m++) {
13361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			DMEMIT("%s ", ms->mirror[m].dev->name);
1337af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow			buffer[m] = device_status_char(&(ms->mirror[m]));
1338af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		}
1339af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		buffer[m] = '\0';
13401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1341af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		DMEMIT("%llu/%llu 1 %s ",
13421f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		      (unsigned long long)log->type->get_sync_count(log),
1343af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		      (unsigned long long)ms->nr_regions, buffer);
1344315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
13451f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		sz += log->type->status(log, type, result+sz, maxlen-sz);
1346315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
13471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		break;
13481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	case STATUSTYPE_TABLE:
13501f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		sz = log->type->status(log, type, result, maxlen);
1351315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
1352e52b8f6dbe18c879ad2b5013f991ec9e46813043Jonathan Brassow		DMEMIT("%d", ms->nr_mirrors);
13531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		for (m = 0; m < ms->nr_mirrors; m++)
1354e52b8f6dbe18c879ad2b5013f991ec9e46813043Jonathan Brassow			DMEMIT(" %s %llu", ms->mirror[m].dev->name,
1355b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow			       (unsigned long long)ms->mirror[m].offset);
1356a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1357a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		if (ms->features & DM_RAID1_HANDLE_ERRORS)
1358a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow			DMEMIT(" 1 handle_errors");
13591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
13601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
13621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
13631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1364af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzerstatic int mirror_iterate_devices(struct dm_target *ti,
1365af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer				  iterate_devices_callout_fn fn, void *data)
1366af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer{
1367af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	struct mirror_set *ms = ti->private;
1368af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	int ret = 0;
1369af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	unsigned i;
1370af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
1371af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	for (i = 0; !ret && i < ms->nr_mirrors; i++)
1372af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer		ret = fn(ti, ms->mirror[i].dev,
13735dea271b6d87bd1d79a59c1d5baac2596a841c37Mike Snitzer			 ms->mirror[i].offset, ti->len, data);
1374af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
1375af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	return ret;
1376af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer}
1377af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
13781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct target_type mirror_target = {
13791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.name	 = "mirror",
1380af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	.version = {1, 12, 0},
13811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.module	 = THIS_MODULE,
13821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.ctr	 = mirror_ctr,
13831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.dtr	 = mirror_dtr,
13841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.map	 = mirror_map,
13851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.end_io	 = mirror_end_io,
1386b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	.presuspend = mirror_presuspend,
13871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.postsuspend = mirror_postsuspend,
13881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.resume	 = mirror_resume,
13891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.status	 = mirror_status,
1390af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	.iterate_devices = mirror_iterate_devices,
13911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds};
13921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int __init dm_mirror_init(void)
13941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
13951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
13961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
139795f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	_dm_raid1_read_record_cache = KMEM_CACHE(dm_raid1_read_record, 0);
139895f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	if (!_dm_raid1_read_record_cache) {
139995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		DMERR("Can't allocate dm_raid1_read_record cache");
140095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		r = -ENOMEM;
140195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		goto bad_cache;
140295f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	}
140395f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
14041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	r = dm_register_target(&mirror_target);
140595f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	if (r < 0) {
14060cd3312434cd1f29bee6bff53bf2790d733ad2a2Alasdair G Kergon		DMERR("Failed to register mirror target");
140795f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		goto bad_target;
140895f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	}
140995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
141095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	return 0;
14111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
141295f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockabad_target:
141395f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	kmem_cache_destroy(_dm_raid1_read_record_cache);
141495f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockabad_cache:
14151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return r;
14161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void __exit dm_mirror_exit(void)
14191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
142010d3bd09a3c25df114f74f7f86e1b58d070bef32Mikulas Patocka	dm_unregister_target(&mirror_target);
142195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	kmem_cache_destroy(_dm_raid1_read_record_cache);
14221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* Module hooks */
14251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_init(dm_mirror_init);
14261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_exit(dm_mirror_exit);
14271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_DESCRIPTION(DM_NAME " mirror target");
14291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_AUTHOR("Joe Thornber");
14301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_LICENSE("GPL");
1431