11da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
21da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Copyright (C) 2003 Sistina Software Limited.
31f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen * Copyright (C) 2005-2008 Red Hat, Inc. All rights reserved.
41da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
51da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * This file is released under the GPL.
61da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
71da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow#include "dm-bio-record.h"
91da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/init.h>
111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/mempool.h>
121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/module.h>
131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/pagemap.h>
141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/slab.h>
151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/workqueue.h>
161f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen#include <linux/device-mapper.h>
17a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-io.h>
18a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-dirty-log.h>
19a765e20eeb423d0fa6a02ffab51141e53bbd93cbAlasdair G Kergon#include <linux/dm-kcopyd.h>
201f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen#include <linux/dm-region-hash.h>
211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
/*
 * Message prefix for this target; consumed by the device-mapper logging
 * macros (DMERR, DMWARN, ...) that are defined outside this file.
 */
#define DM_MSG_PREFIX "raid1"

/* Maximum number of regions recovered in parallel. */
#define MAX_RECOVERY 1

/*
 * Feature flag stored in mirror_set.features.  errors_handled() yields a
 * non-zero value when the flag is set on the mirror set pointed to by p.
 */
#define DM_RAID1_HANDLE_ERRORS 0x01
#define errors_handled(p)	((p)->features & DM_RAID1_HANDLE_ERRORS)
28a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
/*
 * File-wide wait queue; every waiter on it is woken by
 * wakeup_all_recovery_waiters().  The waiters themselves are not in
 * this part of the file.
 */
static DECLARE_WAIT_QUEUE_HEAD(_kmirrord_recovery_stopped);
301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
32e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown * Mirror set structures.
33e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown *---------------------------------------------------------------*/
/*
 * Kinds of failure a mirror leg can suffer.  fail_mirror() uses the value
 * as a bit number in mirror.error_type, so the numbering must stay stable.
 */
enum dm_raid1_error {
	DM_RAID1_WRITE_ERROR,	/* bit 0 */
	DM_RAID1_FLUSH_ERROR,	/* bit 1: reported by mirror_flush() */
	DM_RAID1_SYNC_ERROR,	/* bit 2: reported by recovery_complete() */
	DM_RAID1_READ_ERROR,	/* bit 3 */
};
4072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
41e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brownstruct mirror {
42aa5617c55357d86c9082ba1d66fa9795370c9954Jonathan Brassow	struct mirror_set *ms;
43e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	atomic_t error_count;
4439ed7adb17bdec8224bd3fae551bb7222e05f35bAl Viro	unsigned long error_type;
45e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct dm_dev *dev;
46e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	sector_t offset;
47e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown};
48e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
49e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brownstruct mirror_set {
50e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct dm_target *ti;
51e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct list_head list;
521f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen
53a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	uint64_t features;
54e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
5572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spinlock_t lock;	/* protects the lists */
56e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct bio_list reads;
57e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct bio_list writes;
5872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio_list failures;
5904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio_list holds;	/* bios are waiting until suspend */
60e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
611f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region_hash *rh;
621f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_kcopyd_client *kcopyd_client;
6388be163abb5324bab09f5eff9646590eec5314ebMilan Broz	struct dm_io_client *io_client;
6406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	mempool_t *read_record_pool;
6588be163abb5324bab09f5eff9646590eec5314ebMilan Broz
66e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	/* recovery */
67e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	region_t nr_regions;
68e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	int in_sync;
69fc1ff9588a6d56258ff9576a31aa34f17757c666Jonathan Brassow	int log_failure;
70929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka	int leg_failure;
71b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_t suspend;
72e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
7372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_t default_mirror;	/* Default mirror */
74e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
756ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	struct workqueue_struct *kmirrord_wq;
766ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	struct work_struct kmirrord_work;
77a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	struct timer_list timer;
78a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	unsigned long timer_pending;
79a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
8072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct work_struct trigger_event;
816ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
821f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned nr_mirrors;
83e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown	struct mirror mirror[0];
84e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown};
85e4c8b3ba34cc1aeab451c7a5cc843c5fd62cbe3dNeil Brown
861f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void wakeup_mirrord(void *context)
871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
881f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = context;
891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
906ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	queue_work(ms->kmirrord_wq, &ms->kmirrord_work);
916ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski}
926ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
93a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void delayed_wake_fn(unsigned long data)
94a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka{
95a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	struct mirror_set *ms = (struct mirror_set *) data;
96a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
97a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	clear_bit(0, &ms->timer_pending);
981f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wakeup_mirrord(ms);
99a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka}
100a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
101a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void delayed_wake(struct mirror_set *ms)
102a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka{
103a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	if (test_and_set_bit(0, &ms->timer_pending))
104a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka		return;
105a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
106a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.expires = jiffies + HZ / 5;
107a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.data = (unsigned long) ms;
108a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer.function = delayed_wake_fn;
109a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	add_timer(&ms->timer);
110a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka}
111a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka
1121f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void wakeup_all_recovery_waiters(void *context)
1131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1141f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wake_up_all(&_kmirrord_recovery_stopped);
1151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1171f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void queue_bio(struct mirror_set *ms, struct bio *bio, int rw)
1181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned long flags;
1201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int should_wake = 0;
1211f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct bio_list *bl;
1221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1231f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	bl = (rw == WRITE) ? &ms->writes : &ms->reads;
1241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	spin_lock_irqsave(&ms->lock, flags);
1251f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	should_wake = !(bl->head);
1261f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	bio_list_add(bl, bio);
1271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	spin_unlock_irqrestore(&ms->lock, flags);
1281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (should_wake)
1301f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		wakeup_mirrord(ms);
1311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1331f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic void dispatch_bios(void *context, struct bio_list *bio_list)
1341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1351f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = context;
1361f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct bio *bio;
1371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	while ((bio = bio_list_pop(bio_list)))
1391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		queue_bio(ms, bio, WRITE);
1401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow#define MIN_READ_RECORDS 20
14306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstruct dm_raid1_read_record {
14406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m;
14506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_bio_details details;
14606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow};
14706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
14895f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockastatic struct kmem_cache *_dm_raid1_read_record_cache;
14995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
/*
 * Every mirror should look like this one.
 *
 * NOTE(review): presumably the index of the leg used as the initial
 * default mirror; its users are outside this part of the file.
 */
#define DEFAULT_MIRROR 0
1541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
15606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * This is yucky.  We squirrel the mirror struct away inside
15706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * bi_next for read/write buffers.  This is safe since the bh
1581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * doesn't get submitted to the lower levels of block layer.
1591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
16006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic struct mirror *bio_get_m(struct bio *bio)
1611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
16206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return (struct mirror *) bio->bi_next;
1631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
16506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void bio_set_m(struct bio *bio, struct mirror *m)
1661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
16706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio->bi_next = (struct bio *) m;
1681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
1691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
17072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic struct mirror *get_default_mirror(struct mirror_set *ms)
17172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
17272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	return &ms->mirror[atomic_read(&ms->default_mirror)];
17372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
17472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
17572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void set_default_mirror(struct mirror *m)
17672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
17772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms = m->ms;
17872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror *m0 = &(ms->mirror[0]);
17972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
18072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&ms->default_mirror, m - m0);
18172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
18272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
18387968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patockastatic struct mirror *get_valid_mirror(struct mirror_set *ms)
18487968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka{
18587968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	struct mirror *m;
18687968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka
18787968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	for (m = ms->mirror; m < ms->mirror + ms->nr_mirrors; m++)
18887968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka		if (!atomic_read(&m->error_count))
18987968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka			return m;
19087968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka
19187968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	return NULL;
19287968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka}
19387968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka
19472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow/* fail_mirror
19572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * @m: mirror device to fail
19672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * @error_type: one of the enum's, DM_RAID1_*_ERROR
19772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow *
19872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * If errors are being handled, record the type of
19972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * error encountered for this device.  If this type
20072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * of error has already been recorded, we can return;
20172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * otherwise, we must signal userspace by triggering
20272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * an event.  Additionally, if the device is the
20372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * primary device, we must choose a new primary, but
20472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * only if the mirror is in-sync.
20572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow *
20672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow * This function must not block.
20772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow */
20872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void fail_mirror(struct mirror *m, enum dm_raid1_error error_type)
20972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
21072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms = m->ms;
21172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror *new;
21272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
213929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka	ms->leg_failure = 1;
214929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka
21572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	/*
21672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * error_count is used for nothing more than a
21772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * simple way to tell if a device has encountered
21872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 * errors.
21972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	 */
22072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_inc(&m->error_count);
22172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
22272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (test_and_set_bit(error_type, &m->error_type))
22372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
22472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
225d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow	if (!errors_handled(ms))
226d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow		return;
227d460c65a6a9ec9e0d284864ec3a9a2d1b73f0e43Jonathan Brassow
22872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (m != get_default_mirror(ms))
22972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
23072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
23172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	if (!ms->in_sync) {
23272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		/*
23372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * Better to issue requests to same failing device
23472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 * than to risk returning corrupt data.
23572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		 */
23672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMERR("Primary mirror (%s) failed while out-of-sync: "
23772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		      "Reads may fail.", m->dev->name);
23872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		goto out;
23972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	}
24072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
24187968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	new = get_valid_mirror(ms);
24287968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	if (new)
24387968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka		set_default_mirror(new);
24487968ddd2f3be1c21b932cac30157a83a1c4f935Mikulas Patocka	else
24572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		DMWARN("All sides of mirror have failed.");
24672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
24772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowout:
24872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	schedule_work(&ms->trigger_event);
24972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
25072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
251c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patockastatic int mirror_flush(struct dm_target *ti)
252c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka{
253c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct mirror_set *ms = ti->private;
254c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	unsigned long error_bits;
255c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
256c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	unsigned int i;
257c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct dm_io_region io[ms->nr_mirrors];
258c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct mirror *m;
259c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	struct dm_io_request io_req = {
260d87f4c14f27dc82d215108d8392a7d26687148a1Tejun Heo		.bi_rw = WRITE_FLUSH,
261c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.mem.type = DM_IO_KMEM,
2625fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer		.mem.ptr.addr = NULL,
263c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		.client = ms->io_client,
264c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	};
265c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
266c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	for (i = 0, m = ms->mirror; i < ms->nr_mirrors; i++, m++) {
267c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].bdev = m->dev->bdev;
268c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].sector = 0;
269c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		io[i].count = 0;
270c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	}
271c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
272c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	error_bits = -1;
273c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	dm_io(&io_req, ms->nr_mirrors, io, &error_bits);
274c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	if (unlikely(error_bits != 0)) {
275c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		for (i = 0; i < ms->nr_mirrors; i++)
276c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka			if (test_bit(i, &error_bits))
277c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka				fail_mirror(ms->mirror + i,
27864b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka					    DM_RAID1_FLUSH_ERROR);
279c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka		return -EIO;
280c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	}
281c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
282c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	return 0;
283c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka}
284c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka
2851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
2861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Recovery.
2871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
2881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * When a mirror is first activated we may find that some regions
2891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * are in the no-sync state.  We have to recover these by
2901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recopying from the default mirror to all the others.
2911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
2924cdc1d1fa5c5ac14dc21be19832f02fd0b83867eAlasdair G Kergonstatic void recovery_complete(int read_err, unsigned long write_err,
2931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			      void *context)
2941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
2951f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region *reg = context;
2961f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = dm_rh_region_context(reg);
2978f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	int m, bit = 0;
2981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
2998f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	if (read_err) {
300f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow		/* Read error means the failure of default mirror. */
301f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow		DMERR_LIMIT("Unable to read primary mirror during recovery");
3028f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		fail_mirror(get_default_mirror(ms), DM_RAID1_SYNC_ERROR);
3038f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	}
304f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
3058f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	if (write_err) {
3064cdc1d1fa5c5ac14dc21be19832f02fd0b83867eAlasdair G Kergon		DMERR_LIMIT("Write error during recovery (error = 0x%lx)",
307f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow			    write_err);
3088f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		/*
3098f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 * Bits correspond to devices (excluding default mirror).
3108f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 * The default mirror cannot change during recovery.
3118f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		 */
3128f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		for (m = 0; m < ms->nr_mirrors; m++) {
3138f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			if (&ms->mirror[m] == get_default_mirror(ms))
3148f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow				continue;
3158f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			if (test_bit(bit, &write_err))
3168f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow				fail_mirror(ms->mirror + m,
3178f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow					    DM_RAID1_SYNC_ERROR);
3188f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow			bit++;
3198f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow		}
3208f0205b798f926e2745de5fdebf0a8605c621de6Jonathan Brassow	}
321f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
3221f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_recovery_end(reg, !(read_err || write_err));
3231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3251f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic int recover(struct mirror_set *ms, struct dm_region *reg)
3261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
3271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
3281f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned i;
329eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	struct dm_io_region from, to[DM_KCOPYD_MAX_REGIONS], *dest;
3301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
3311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned long flags = 0;
3321f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	region_t key = dm_rh_get_region_key(reg);
3331f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	sector_t region_size = dm_rh_get_region_size(ms->rh);
3341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* fill in the source */
33672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	m = get_default_mirror(ms);
3371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	from.bdev = m->dev->bdev;
3381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	from.sector = m->offset + dm_rh_region_to_sector(ms->rh, key);
3391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (key == (ms->nr_regions - 1)) {
3401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
3411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * The final region may be smaller than
3421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * region_size.
3431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
3441f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		from.count = ms->ti->len & (region_size - 1);
3451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (!from.count)
3461f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			from.count = region_size;
3471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	} else
3481f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		from.count = region_size;
3491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* fill in the destinations */
3511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	for (i = 0, dest = to; i < ms->nr_mirrors; i++) {
35272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (&ms->mirror[i] == get_default_mirror(ms))
3531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			continue;
3541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		m = ms->mirror + i;
3561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest->bdev = m->dev->bdev;
3571f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		dest->sector = m->offset + dm_rh_region_to_sector(ms->rh, key);
3581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest->count = from.count;
3591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dest++;
3601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* hand to kcopyd */
363f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow	if (!errors_handled(ms))
364f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow		set_bit(DM_KCOPYD_IGNORE_ERROR, &flags);
365f7c83e2e4783c4f7abe6f3a85a8c5e210f98bc7bJonathan Brassow
366eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	r = dm_kcopyd_copy(ms->kcopyd_client, &from, ms->nr_mirrors - 1, to,
367eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen			   flags, recovery_complete, reg);
3681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return r;
3701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
3711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_recovery(struct mirror_set *ms)
3731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
3741f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_region *reg;
3751f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
3761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
3771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Start quiescing some regions.
3801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3811f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_recovery_prepare(ms->rh);
3821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Copy any already quiesced regions.
3851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3861f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	while ((reg = dm_rh_recovery_start(ms->rh))) {
3871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		r = recover(ms, reg);
3881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (r)
3891f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen			dm_rh_recovery_end(reg, 0);
3901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
3911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
3921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
3931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Update the in sync flag.
3941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
3951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms->in_sync &&
3961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	    (log->type->get_sync_count(log) == ms->nr_regions)) {
3971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* the sync is complete */
3981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dm_table_event(ms->ti->table);
3991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		ms->in_sync = 1;
4001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
4011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
4021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
4031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
4041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Reads
4051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
4061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror *choose_mirror(struct mirror_set *ms, sector_t sector)
4071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
40806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m = get_default_mirror(ms);
40906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	do {
41106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (likely(!atomic_read(&m->error_count)))
41206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return m;
41306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (m-- == ms->mirror)
41506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			m += ms->nr_mirrors;
41606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	} while (m != get_default_mirror(ms));
41706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
41806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return NULL;
41906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
42006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic int default_ok(struct mirror *m)
42206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
42306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *default_mirror = get_default_mirror(m->ms);
42406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return !atomic_read(&default_mirror->error_count);
42606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
42706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
42806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic int mirror_available(struct mirror_set *ms, struct bio *bio)
42906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
4301f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
4311f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	region_t region = dm_rh_bio_to_region(ms->rh, bio);
43206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
4331f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (log->type->in_sync(log, region, 0))
43406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return choose_mirror(ms,  bio->bi_sector) ? 1 : 0;
43506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
43606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return 0;
4371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
4381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
4391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
4401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * remap a buffer to a particular mirror.
4411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
44206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic sector_t map_sector(struct mirror *m, struct bio *bio)
44306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
4444184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka	if (unlikely(!bio->bi_size))
4454184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		return 0;
446b441a262e7d1c56fbe21794c91d7a9c83809113fAlasdair G Kergon	return m->offset + dm_target_offset(m->ms->ti, bio->bi_sector);
44706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
44806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
44906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void map_bio(struct mirror *m, struct bio *bio)
4501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
4511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio->bi_bdev = m->dev->bdev;
45206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio->bi_sector = map_sector(m, bio);
45306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
45406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
45522a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagenstatic void map_region(struct dm_io_region *io, struct mirror *m,
45606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		       struct bio *bio)
45706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
45806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->bdev = m->dev->bdev;
45906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->sector = map_sector(m, bio);
46006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	io->count = bio->bi_size >> 9;
46106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
46206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
46304788507686d184d8166918b70ef52311bc36dcbMikulas Patockastatic void hold_bio(struct mirror_set *ms, struct bio *bio)
46404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka{
46504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
466f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 * Lock is required to avoid race condition during suspend
467f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 * process.
46804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
469f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	spin_lock_irq(&ms->lock);
470f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui
47104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	if (atomic_read(&ms->suspend)) {
472f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui		spin_unlock_irq(&ms->lock);
473f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui
474f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui		/*
475f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui		 * If device is suspended, complete the bio.
476f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui		 */
47704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		if (dm_noflush_suspending(ms->ti))
47804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka			bio_endio(bio, DM_ENDIO_REQUEUE);
47904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		else
48004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka			bio_endio(bio, -EIO);
48104788507686d184d8166918b70ef52311bc36dcbMikulas Patocka		return;
48204788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	}
48304788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
48404788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	/*
48504788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 * Hold bio until the suspend is complete.
48604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	 */
48704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	bio_list_add(&ms->holds, bio);
48804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	spin_unlock_irq(&ms->lock);
48904788507686d184d8166918b70ef52311bc36dcbMikulas Patocka}
49004788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
49106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow/*-----------------------------------------------------------------
49206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow * Reads
49306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow *---------------------------------------------------------------*/
49406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void read_callback(unsigned long error, void *context)
49506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
49606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct bio *bio = context;
49706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m;
49806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
49906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	m = bio_get_m(bio);
50006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, NULL);
50106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(!error)) {
50306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		bio_endio(bio, 0);
50406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return;
50506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
50606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	fail_mirror(m, DM_RAID1_READ_ERROR);
50806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
50906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(default_ok(m)) || mirror_available(m->ms, bio)) {
51006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMWARN_LIMIT("Read failure on mirror device %s.  "
51106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			     "Trying alternative device.",
51206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			     m->dev->name);
51306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		queue_bio(m->ms, bio, bio_rw(bio));
51406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return;
51506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
51606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
51706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	DMERR_LIMIT("Read failure on mirror device %s.  Failing I/O.",
51806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		    m->dev->name);
51906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_endio(bio, -EIO);
52006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow}
52106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
52206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow/* Asynchronous read. */
52306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowstatic void read_async_bio(struct mirror *m, struct bio *bio)
52406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow{
52522a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagen	struct dm_io_region io;
52606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_io_request io_req = {
52706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.bi_rw = READ,
52806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.mem.type = DM_IO_BVEC,
52906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.mem.ptr.bvec = bio->bi_io_vec + bio->bi_idx,
53006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.notify.fn = read_callback,
53106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.notify.context = bio,
53206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		.client = m->ms->io_client,
53306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	};
53406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
53506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	map_region(&io, m, bio);
53606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, m);
5371f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	BUG_ON(dm_io(&io_req, 1, &io, NULL));
5381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen}
5391f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen
5401f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagenstatic inline int region_in_sync(struct mirror_set *ms, region_t region,
5411f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				 int may_block)
5421f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen{
5431f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	int state = dm_rh_get_state(ms->rh, region, may_block);
5441f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	return state == DM_RH_CLEAN || state == DM_RH_DIRTY;
5451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
5461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_reads(struct mirror_set *ms, struct bio_list *reads)
5481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
5491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	region_t region;
5501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio;
5511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
5521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(reads))) {
5541f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		region = dm_rh_bio_to_region(ms->rh, bio);
55506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		m = get_default_mirror(ms);
5561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/*
5581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 * We can only read balance if the region is in sync.
5591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		 */
5601f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		if (likely(region_in_sync(ms, region, 1)))
5611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			m = choose_mirror(ms, bio->bi_sector);
56206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		else if (m && atomic_read(&m->error_count))
56306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			m = NULL;
5641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
56506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (likely(m))
56606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			read_async_bio(m, bio);
56706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		else
56806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			bio_endio(bio, -EIO);
5691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
5701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
5711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
5731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Writes.
5741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
5751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * We do different things with the write io depending on the
5761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * state of the region that it's in:
5771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
5781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * SYNC: 	increment pending, use kcopyd to write to *all* mirrors
5791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * RECOVERING:	delay the io until recovery completes
5801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * NOSYNC:	increment pending, just write to the default mirror
5811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
58272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
58372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
5841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void write_callback(unsigned long error, void *context)
5851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
58672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned i, ret = 0;
5871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio = (struct bio *) context;
5881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms;
58972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	int should_wake = 0;
59072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned long flags;
5911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
59206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	ms = bio_get_m(bio)->ms;
59306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, NULL);
5941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
5951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
5961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * NOTE: We don't decrement the pending count here,
5971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * instead it is done by the targets endio function.
5981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * This way we handle both writes to SYNC and NOSYNC
5991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * regions with the same code.
6001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
60160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	if (likely(!error)) {
60260f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		bio_endio(bio, ret);
60360f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		return;
60460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	}
6051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
60672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	for (i = 0; i < ms->nr_mirrors; i++)
60772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		if (test_bit(i, &error))
60872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow			fail_mirror(ms->mirror + i, DM_RAID1_WRITE_ERROR);
60972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
61060f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	/*
61160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 * Need to raise event.  Since raising
61260f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 * events can block, we need to do it in
61360f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 * the main thread.
61460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	 */
61560f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	spin_lock_irqsave(&ms->lock, flags);
61660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	if (!ms->failures.head)
61760f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		should_wake = 1;
61860f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	bio_list_add(&ms->failures, bio);
61960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	spin_unlock_irqrestore(&ms->lock, flags);
62060f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka	if (should_wake)
62160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		wakeup_mirrord(ms);
6221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
6231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_write(struct mirror_set *ms, struct bio *bio)
6251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
6261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned int i;
62722a1ceb1e6a7fbce95a1531ff10bb4fb036d4a37Heinz Mauelshagen	struct dm_io_region io[ms->nr_mirrors], *dest = io;
6281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
62988be163abb5324bab09f5eff9646590eec5314ebMilan Broz	struct dm_io_request io_req = {
630d87f4c14f27dc82d215108d8392a7d26687148a1Tejun Heo		.bi_rw = WRITE | (bio->bi_rw & WRITE_FLUSH_FUA),
63188be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.mem.type = DM_IO_BVEC,
63288be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.mem.ptr.bvec = bio->bi_io_vec + bio->bi_idx,
63388be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.notify.fn = write_callback,
63488be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.notify.context = bio,
63588be163abb5324bab09f5eff9646590eec5314ebMilan Broz		.client = ms->io_client,
63688be163abb5324bab09f5eff9646590eec5314ebMilan Broz	};
6371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6385fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer	if (bio->bi_rw & REQ_DISCARD) {
6395fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer		io_req.bi_rw |= REQ_DISCARD;
6405fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer		io_req.mem.type = DM_IO_KMEM;
6415fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer		io_req.mem.ptr.addr = NULL;
6425fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer	}
6435fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer
64406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	for (i = 0, m = ms->mirror; i < ms->nr_mirrors; i++, m++)
64506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_region(dest++, m, bio);
6461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
64706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	/*
64806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * Use default mirror because we only need it to retrieve the reference
64906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * to the mirror set in write_callback().
65006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 */
65106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	bio_set_m(bio, get_default_mirror(ms));
65288be163abb5324bab09f5eff9646590eec5314ebMilan Broz
6531f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	BUG_ON(dm_io(&io_req, ms->nr_mirrors, io, NULL));
6541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
6551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_writes(struct mirror_set *ms, struct bio_list *writes)
6571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
6581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int state;
6591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio *bio;
6601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct bio_list sync, nosync, recover, *this_list = NULL;
6617513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	struct bio_list requeue;
6627513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
6637513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	region_t region;
6641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!writes->head)
6661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return;
6671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
6691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Classify each write.
6701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
6711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&sync);
6721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&nosync);
6731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&recover);
6747513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	bio_list_init(&requeue);
6751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(writes))) {
6775fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer		if ((bio->bi_rw & REQ_FLUSH) ||
6785fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer		    (bio->bi_rw & REQ_DISCARD)) {
6794184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			bio_list_add(&sync, bio);
6804184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			continue;
6814184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka		}
6824184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka
6837513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		region = dm_rh_bio_to_region(ms->rh, bio);
6847513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
6857513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		if (log->type->is_remote_recovering &&
6867513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		    log->type->is_remote_recovering(log, region)) {
6877513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow			bio_list_add(&requeue, bio);
6887513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow			continue;
6897513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		}
6907513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
6917513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		state = dm_rh_get_state(ms->rh, region, 1);
6921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		switch (state) {
6931f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_CLEAN:
6941f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_DIRTY:
6951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &sync;
6961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
6971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
6981f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_NOSYNC:
6991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &nosync;
7001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
7011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7021f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		case DM_RH_RECOVERING:
7031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			this_list = &recover;
7041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			break;
7051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		}
7061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		bio_list_add(this_list, bio);
7081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
7091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
7117513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 * Add bios that are delayed due to remote recovery
7127513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 * back on to the write queue
7137513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	 */
7147513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	if (unlikely(requeue.head)) {
7157513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		spin_lock_irq(&ms->lock);
7167513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		bio_list_merge(&ms->writes, &requeue);
7177513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow		spin_unlock_irq(&ms->lock);
71869885683d22d8c05910fd808c01fdce1322739b4Mikulas Patocka		delayed_wake(ms);
7197513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	}
7207513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow
7217513c2a761d69d2a93f17146b3563527d3618ba0Jonathan Brassow	/*
7221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Increment the pending counts for any regions that will
7231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * be written to (writes to recover regions are going to
7241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * be delayed).
7251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
7261f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_inc_pending(ms->rh, &sync);
7271f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_inc_pending(ms->rh, &nosync);
728d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow
729d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	/*
730d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * If the flush fails on a previous call and succeeds here,
731d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * we must not reset the log_failure variable.  We need
732d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 * userspace interaction to do that.
733d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	 */
734d2b698644c97cb033261536a4f2010924a00eac9Jonathan Brassow	ms->log_failure = dm_rh_flush(ms->rh) ? 1 : ms->log_failure;
7351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
7371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * Dispatch io.
7381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
7395528d17de1cf1462f285c40ccaf8e0d0e4c64dc0Mikulas Patocka	if (unlikely(ms->log_failure) && errors_handled(ms)) {
740b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		spin_lock_irq(&ms->lock);
741b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		bio_list_merge(&ms->failures, &sync);
742b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		spin_unlock_irq(&ms->lock);
7431f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		wakeup_mirrord(ms);
744b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	} else
745fc1ff9588a6d56258ff9576a31aa34f17757c666Jonathan Brassow		while ((bio = bio_list_pop(&sync)))
746b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow			do_write(ms, bio);
7471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(&recover)))
7491f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		dm_rh_delay(ms->rh, bio);
7501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
7511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while ((bio = bio_list_pop(&nosync))) {
752ede5ea0b8b815560dc54c712536fdf0b456b6ad0Mikulas Patocka		if (unlikely(ms->leg_failure) && errors_handled(ms)) {
753ede5ea0b8b815560dc54c712536fdf0b456b6ad0Mikulas Patocka			spin_lock_irq(&ms->lock);
754ede5ea0b8b815560dc54c712536fdf0b456b6ad0Mikulas Patocka			bio_list_add(&ms->failures, bio);
755ede5ea0b8b815560dc54c712536fdf0b456b6ad0Mikulas Patocka			spin_unlock_irq(&ms->lock);
756ede5ea0b8b815560dc54c712536fdf0b456b6ad0Mikulas Patocka			wakeup_mirrord(ms);
757ede5ea0b8b815560dc54c712536fdf0b456b6ad0Mikulas Patocka		} else {
758929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka			map_bio(get_default_mirror(ms), bio);
759929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka			generic_make_request(bio);
760929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka		}
7611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
7621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
7631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
76472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void do_failures(struct mirror_set *ms, struct bio_list *failures)
76572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
76672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio *bio;
76772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
7680f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	if (likely(!failures->head))
76972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		return;
77072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
771b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
772b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * If the log has failed, unattempted writes are being
7730f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	 * put on the holds list.  We can't issue those writes
774b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * until a log has been marked, so we must store them.
775b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 *
776b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * If a 'noflush' suspend is in progress, we can requeue
777b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * the I/O's to the core.  This give userspace a chance
778b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * to reconfigure the mirror, at which point the core
779b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * will reissue the writes.  If the 'noflush' flag is
780b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * not set, we have no choice but to return errors.
781b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 *
782b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * Some writes on the failures list may have been
783b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * submitted before the log failure and represent a
784b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * failure to write to one of the devices.  It is ok
785b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * for us to treat them the same and requeue them
786b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * as well.
787b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
7880f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka	while ((bio = bio_list_pop(failures))) {
78960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		if (!ms->log_failure) {
7900f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka			ms->in_sync = 0;
791c58098be979509a54021e837a47fcad08db31f94Mikulas Patocka			dm_rh_mark_nosync(ms->rh, bio);
7920f398a8403e31c737b429fddc3850093d0bf58d0Mikulas Patocka		}
79360f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka
79460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		/*
79560f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * If all the legs are dead, fail the I/O.
79660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * If we have been told to handle errors, hold the bio
79760f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * and wait for userspace to deal with the problem.
79860f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * Otherwise pretend that the I/O succeeded. (This would
79960f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * be wrong if the failed leg returned after reboot and
80060f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 * got replicated back to the good legs.)
80160f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		 */
80260f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		if (!get_valid_mirror(ms))
80360f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka			bio_endio(bio, -EIO);
80460f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		else if (errors_handled(ms))
80560f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka			hold_bio(ms, bio);
80660f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka		else
80760f355ead31e2be8d06ac8acb163df91a1c64e3bMikulas Patocka			bio_endio(bio, 0);
808b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	}
80972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
81072f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
81172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassowstatic void trigger_event(struct work_struct *work)
81272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow{
81372f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct mirror_set *ms =
81472f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow		container_of(work, struct mirror_set, trigger_event);
81572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
81672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	dm_table_event(ms->ti->table);
81772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow}
81872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow
8191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
8201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * kmirrord
8211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
822a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patockastatic void do_mirror(struct work_struct *work)
8231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8241f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct mirror_set *ms = container_of(work, struct mirror_set,
8251f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     kmirrord_work);
82672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	struct bio_list reads, writes, failures;
82772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	unsigned long flags;
8281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
82972f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spin_lock_irqsave(&ms->lock, flags);
8301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	reads = ms->reads;
8311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	writes = ms->writes;
83272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	failures = ms->failures;
8331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&ms->reads);
8341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	bio_list_init(&ms->writes);
83572f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	bio_list_init(&ms->failures);
83672f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	spin_unlock_irqrestore(&ms->lock, flags);
8371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8381f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_update_states(ms->rh, errors_handled(ms));
8391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_recovery(ms);
8401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_reads(ms, &reads);
8411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	do_writes(ms, &writes);
84272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	do_failures(ms, &failures);
8431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
8441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*-----------------------------------------------------------------
8461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Target functions
8471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/
8481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror_set *alloc_context(unsigned int nr_mirrors,
8491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds					uint32_t region_size,
8501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds					struct dm_target *ti,
851416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen					struct dm_dirty_log *dl)
8521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
8531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	size_t len;
8541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = NULL;
8551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	len = sizeof(*ms) + (sizeof(ms->mirror[0]) * nr_mirrors);
8571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
858dd00cc486ab1c17049a535413d1751ef3482141cYoann Padioleau	ms = kzalloc(len, GFP_KERNEL);
8591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms) {
86072d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Cannot allocate mirror context";
8611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
8621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
8631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	spin_lock_init(&ms->lock);
8655339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->reads);
8665339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->writes);
8675339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->failures);
8685339fc2d47d1d720e027b9b832bf5aae8fba2ac0Mikulas Patocka	bio_list_init(&ms->holds);
8691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
8701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->ti = ti;
8711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->nr_mirrors = nr_mirrors;
8721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->nr_regions = dm_sector_div_up(ti->len, region_size);
8731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->in_sync = 0;
874b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	ms->log_failure = 0;
875929be8fcb4b4b65d038e73d3bb34715851a95ca2Mikulas Patocka	ms->leg_failure = 0;
876b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 0);
87772f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&ms->default_mirror, DEFAULT_MIRROR);
8781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
87995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	ms->read_record_pool = mempool_create_slab_pool(MIN_READ_RECORDS,
88095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka						_dm_raid1_read_record_cache);
88195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
88206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (!ms->read_record_pool) {
88306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		ti->error = "Error creating mirror read_record_pool";
88406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		kfree(ms);
88506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return NULL;
88606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
88706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
888bda8efec5c706a672e0714d341a342e811f0262aMikulas Patocka	ms->io_client = dm_io_client_create();
88988be163abb5324bab09f5eff9646590eec5314ebMilan Broz	if (IS_ERR(ms->io_client)) {
89088be163abb5324bab09f5eff9646590eec5314ebMilan Broz		ti->error = "Error creating dm_io client";
89106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_destroy(ms->read_record_pool);
89288be163abb5324bab09f5eff9646590eec5314ebMilan Broz		kfree(ms);
89388be163abb5324bab09f5eff9646590eec5314ebMilan Broz 		return NULL;
89488be163abb5324bab09f5eff9646590eec5314ebMilan Broz	}
89588be163abb5324bab09f5eff9646590eec5314ebMilan Broz
8961f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	ms->rh = dm_region_hash_create(ms, dispatch_bios, wakeup_mirrord,
8971f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       wakeup_all_recovery_waiters,
8981f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       ms->ti->begin, MAX_RECOVERY,
8991f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen				       dl, region_size, ms->nr_regions);
9001f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	if (IS_ERR(ms->rh)) {
90172d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Error creating dirty region hash";
902a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		dm_io_client_destroy(ms->io_client);
90306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_destroy(ms->read_record_pool);
9041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		kfree(ms);
9051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return ms;
9091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void free_context(struct mirror_set *ms, struct dm_target *ti,
9121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 unsigned int m)
9131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	while (m--)
9151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		dm_put_device(ti, ms->mirror[m].dev);
9161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
91788be163abb5324bab09f5eff9646590eec5314ebMilan Broz	dm_io_client_destroy(ms->io_client);
9181f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_region_hash_destroy(ms->rh);
91906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	mempool_destroy(ms->read_record_pool);
9201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	kfree(ms);
9211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int get_mirror(struct mirror_set *ms, struct dm_target *ti,
9241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		      unsigned int mirror, char **argv)
9251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9264ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton	unsigned long long offset;
92731998ef19385c944600d9a981b96252f98204beeMikulas Patocka	char dummy;
9281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
92931998ef19385c944600d9a981b96252f98204beeMikulas Patocka	if (sscanf(argv[1], "%llu%c", &offset, &dummy) != 1) {
93072d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid offset";
9311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
9321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9348215d6ec5fee1e76545decea2cd73717efb5cb42Nikanth Karthikesan	if (dm_get_device(ti, argv[0], dm_table_get_mode(ti->table),
9351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			  &ms->mirror[mirror].dev)) {
93672d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Device lookup failure";
9371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -ENXIO;
9381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
940aa5617c55357d86c9082ba1d66fa9795370c9954Jonathan Brassow	ms->mirror[mirror].ms = ms;
94172f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	atomic_set(&(ms->mirror[mirror].error_count), 0);
94272f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	ms->mirror[mirror].error_type = 0;
9431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms->mirror[mirror].offset = offset;
9441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
9461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
9491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Create dirty log: log_type #log_params <log_params>
9501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
951416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagenstatic struct dm_dirty_log *create_dirty_log(struct dm_target *ti,
9521f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     unsigned argc, char **argv,
9531f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen					     unsigned *args_used)
9541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
9551f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	unsigned param_count;
956416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen	struct dm_dirty_log *dl;
95731998ef19385c944600d9a981b96252f98204beeMikulas Patocka	char dummy;
9581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (argc < 2) {
96072d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Insufficient mirror log arguments";
9611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
96431998ef19385c944600d9a981b96252f98204beeMikulas Patocka	if (sscanf(argv[1], "%u%c", &param_count, &dummy) != 1) {
96572d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid mirror log argument count";
9661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	*args_used = 2 + param_count;
9701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (argc < *args_used) {
97272d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Insufficient mirror log arguments";
9731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
976c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka	dl = dm_dirty_log_create(argv[0], ti, mirror_flush, param_count,
977c0da3748b9a894b9f9b561ecc2d090a913988a0fMikulas Patocka				 argv + 2);
9781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!dl) {
97972d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Error creating mirror dirty log";
9801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return NULL;
9811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
9821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
9831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return dl;
9841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
9851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
986a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassowstatic int parse_features(struct mirror_set *ms, unsigned argc, char **argv,
987a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow			  unsigned *args_used)
988a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow{
989a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	unsigned num_features;
990a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	struct dm_target *ti = ms->ti;
99131998ef19385c944600d9a981b96252f98204beeMikulas Patocka	char dummy;
992a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
993a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	*args_used = 0;
994a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
995a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (!argc)
996a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return 0;
997a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
99831998ef19385c944600d9a981b96252f98204beeMikulas Patocka	if (sscanf(argv[0], "%u%c", &num_features, &dummy) != 1) {
999a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Invalid number of features";
1000a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
1001a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1002a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1003a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argc--;
1004a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argv++;
1005a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	(*args_used)++;
1006a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1007a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (num_features > argc) {
1008a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Not enough arguments to support feature count";
1009a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
1010a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1011a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1012a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (!strcmp("handle_errors", argv[0]))
1013a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ms->features |= DM_RAID1_HANDLE_ERRORS;
1014a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	else {
1015a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Unrecognised feature requested";
1016a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		return -EINVAL;
1017a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1018a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1019a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	(*args_used)++;
1020a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1021a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	return 0;
1022a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow}
1023a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
10241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
10251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Construct a mirror mapping:
10261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
10271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type #log_params <log_params>
10281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #mirrors [mirror_path offset]{2,}
1029a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow * [#features <features>]
10301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *
10311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type is "core" or "disk"
10321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #log_params is between 1 and 3
1033a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow *
1034a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow * If present, features must be "handle_errors".
10351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
10361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_ctr(struct dm_target *ti, unsigned int argc, char **argv)
10371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
10381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
10391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	unsigned int nr_mirrors, m, args_used;
10401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms;
1041416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen	struct dm_dirty_log *dl;
104231998ef19385c944600d9a981b96252f98204beeMikulas Patocka	char dummy;
10431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	dl = create_dirty_log(ti, argc, argv, &args_used);
10451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!dl)
10461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argv += args_used;
10491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argc -= args_used;
10501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
105131998ef19385c944600d9a981b96252f98204beeMikulas Patocka	if (!argc || sscanf(argv[0], "%u%c", &nr_mirrors, &dummy) != 1 ||
1052eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	    nr_mirrors < 2 || nr_mirrors > DM_KCOPYD_MAX_REGIONS + 1) {
105372d9486169a2a8353e022813185ba2f32d7dde69Alasdair G Kergon		ti->error = "Invalid number of mirrors";
1054416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	argv++, argc--;
10591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1060a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (argc < nr_mirrors * 2) {
1061a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Too few mirror arguments";
1062416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EINVAL;
10641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ms = alloc_context(nr_mirrors, dl->type->get_region_size(dl), ti, dl);
10671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (!ms) {
1068416cd17b1982217bca3dc41b9f00b0b38fdaadadHeinz Mauelshagen		dm_dirty_log_destroy(dl);
10691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -ENOMEM;
10701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/* Get the mirror parameter sets */
10731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	for (m = 0; m < nr_mirrors; m++) {
10741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		r = get_mirror(ms, ti, m, argv);
10751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		if (r) {
10761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			free_context(ms, ti, m);
10771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			return r;
10781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		}
10791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		argv += 2;
10801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		argc -= 2;
10811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
10821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	ti->private = ms;
10841f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	ti->split_io = dm_rh_get_region_size(ms->rh);
10854184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka	ti->num_flush_requests = 1;
10865fc2ffeabb9ee0fc0e71ff16b49f34f0ed3d05b4Mike Snitzer	ti->num_discard_requests = 1;
10871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
10889c4376de98719d2768dd919553843de34bb094a6Tejun Heo	ms->kmirrord_wq = alloc_workqueue("kmirrord",
10899c4376de98719d2768dd919553843de34bb094a6Tejun Heo					  WQ_NON_REENTRANT | WQ_MEM_RECLAIM, 0);
10906ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	if (!ms->kmirrord_wq) {
10916ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski		DMERR("couldn't start kmirrord");
1092a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		r = -ENOMEM;
1093a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_free_context;
10946ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	}
10956ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	INIT_WORK(&ms->kmirrord_work, do_mirror);
1096a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	init_timer(&ms->timer);
1097a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	ms->timer_pending = 0;
109872f4b314100bae85c75d8e4c6fec621ab44e777dJonathan Brassow	INIT_WORK(&ms->trigger_event, trigger_event);
10996ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski
1100a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	r = parse_features(ms, argc, argv, &args_used);
1101a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	if (r)
1102a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1103a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1104a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argv += args_used;
1105a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	argc -= args_used;
1106a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1107f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	/*
1108f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * Any read-balancing addition depends on the
1109f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * DM_RAID1_HANDLE_ERRORS flag being present.
1110f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * This is because the decision to balance depends
1111f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * on the sync state of a region.  If the above
1112f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * flag is not present, we ignore errors; and
1113f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 * the sync state may be inaccurate.
1114f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow	 */
1115f44db678edcc6f4c2779ac43f63f0b9dfa28b724Jonathan Brassow
1116a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	if (argc) {
1117a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		ti->error = "Too many mirror arguments";
1118a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		r = -EINVAL;
1119a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1120a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow	}
1121a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1122fa34ce73072f90ecd90dcc43f29d82e70e5f8676Mikulas Patocka	ms->kcopyd_client = dm_kcopyd_client_create();
1123fa34ce73072f90ecd90dcc43f29d82e70e5f8676Mikulas Patocka	if (IS_ERR(ms->kcopyd_client)) {
1124fa34ce73072f90ecd90dcc43f29d82e70e5f8676Mikulas Patocka		r = PTR_ERR(ms->kcopyd_client);
1125a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov		goto err_destroy_wq;
1126fa34ce73072f90ecd90dcc43f29d82e70e5f8676Mikulas Patocka	}
11271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11281f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	wakeup_mirrord(ms);
11291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
1130a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov
1131a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhoverr_destroy_wq:
1132a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	destroy_workqueue(ms->kmirrord_wq);
1133a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhoverr_free_context:
1134a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	free_context(ms, ti, ms->nr_mirrors);
1135a72cf737e09da409e047863e38410930dae5fe05Dmitry Monakhov	return r;
11361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_dtr(struct dm_target *ti)
11391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
11411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1142a2aebe03be60ae4da03507a00d60211d5e0327c3Mikulas Patocka	del_timer_sync(&ms->timer);
11436ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	flush_workqueue(ms->kmirrord_wq);
1144d5ffa387e24646cb1cb55d80fd0f182a00e0edb7Tejun Heo	flush_work_sync(&ms->trigger_event);
1145eb69aca5d3370b81450d68edeebc2bb9a3eb9689Heinz Mauelshagen	dm_kcopyd_client_destroy(ms->kcopyd_client);
11466ad36fe2b451cc85cc7b14f4128286759e217124Holger Smolinski	destroy_workqueue(ms->kmirrord_wq);
11471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	free_context(ms, ti, ms->nr_mirrors);
11481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
11491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*
11511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Mirror mapping function
11521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */
11531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_map(struct dm_target *ti, struct bio *bio,
11541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		      union map_info *map_context)
11551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
11561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r, rw = bio_rw(bio);
11571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror *m;
11581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = ti->private;
115906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_raid1_read_record *read_record = NULL;
11601f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
11611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (rw == WRITE) {
116306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		/* Save region for mirror_end_io() handler */
11641f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		map_context->ll = dm_rh_bio_to_region(ms->rh, bio);
11651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		queue_bio(ms, bio, rw);
1166d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda		return DM_MAPIO_SUBMITTED;
11671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
11681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11691f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	r = log->type->in_sync(log, dm_rh_bio_to_region(ms->rh, bio), 0);
11701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (r < 0 && r != -EWOULDBLOCK)
11711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return r;
11721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
117406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * If region is not in-sync queue the bio.
11751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
117606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (!r || (r == -EWOULDBLOCK)) {
117706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (rw == READA)
117806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return -EWOULDBLOCK;
11791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
11801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		queue_bio(ms, bio, rw);
1181d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda		return DM_MAPIO_SUBMITTED;
11821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
11831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
118406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	/*
118506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * The region is in-sync and we can perform reads directly.
118606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 * Store enough information so we can retry if it fails.
118706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	 */
11881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	m = choose_mirror(ms, bio->bi_sector);
118906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (unlikely(!m))
11901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		return -EIO;
11911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
119206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	read_record = mempool_alloc(ms->read_record_pool, GFP_NOIO);
119306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (likely(read_record)) {
119406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		dm_bio_record(&read_record->details, bio);
119506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_context->ptr = read_record;
119606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		read_record->m = m;
119706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
119806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
119906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	map_bio(m, bio);
120006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
1201d2a7ad29a810441e9dacbaddcc2f0c6045390008Kiyoshi Ueda	return DM_MAPIO_REMAPPED;
12021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
12031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
12041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_end_io(struct dm_target *ti, struct bio *bio,
12051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 int error, union map_info *map_context)
12061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
12071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int rw = bio_rw(bio);
12081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
120906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct mirror *m = NULL;
121006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_bio_details *bd = NULL;
121106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	struct dm_raid1_read_record *read_record = map_context->ptr;
12121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
12131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	/*
12141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 * We need to dec pending if this was a write.
12151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	 */
121606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (rw == WRITE) {
1217d87f4c14f27dc82d215108d8392a7d26687148a1Tejun Heo		if (!(bio->bi_rw & REQ_FLUSH))
12184184153f9e483f9bb63339ed316e059962fe9794Mikulas Patocka			dm_rh_dec(ms->rh, map_context->ll);
121906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		return error;
122006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
12211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
122206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (error == -EOPNOTSUPP)
122306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		goto out;
122406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
12257b6d91daee5cac6402186ff224c3af39d79f4a0eChristoph Hellwig	if ((error == -EWOULDBLOCK) && (bio->bi_rw & REQ_RAHEAD))
122606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		goto out;
122706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
122806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (unlikely(error)) {
122906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (!read_record) {
123006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			/*
123106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * There wasn't enough memory to record necessary
123206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * information for a retry or there was no other
123306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 * mirror in-sync.
123406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			 */
1235e03f1a842287480aa03732612148c0d333baca61Adrian Bunk			DMERR_LIMIT("Mirror read failed.");
123606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return -EIO;
123706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		}
1238e03f1a842287480aa03732612148c0d333baca61Adrian Bunk
1239e03f1a842287480aa03732612148c0d333baca61Adrian Bunk		m = read_record->m;
1240e03f1a842287480aa03732612148c0d333baca61Adrian Bunk
124106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMERR("Mirror read failed from %s. Trying alternative device.",
124206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		      m->dev->name);
124306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
124406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		fail_mirror(m, DM_RAID1_READ_ERROR);
124506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
124606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		/*
124706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 * A failed read is requeued for another attempt using an intact
124806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 * mirror.
124906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		 */
125006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		if (default_ok(m) || mirror_available(ms, bio)) {
125106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			bd = &read_record->details;
125206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
125306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			dm_bio_restore(bd, bio);
125406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			mempool_free(read_record, ms->read_record_pool);
125506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			map_context->ptr = NULL;
125606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			queue_bio(ms, bio, rw);
125706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow			return 1;
125806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		}
125906386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		DMERR("All replicated volumes dead, failing I/O");
126006386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
126106386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
126206386bbfd2441416875d0403d405c56822f6ebacJonathan Brassowout:
126306386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	if (read_record) {
126406386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		mempool_free(read_record, ms->read_record_pool);
126506386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow		map_context->ptr = NULL;
126606386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	}
126706386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow
126806386bbfd2441416875d0403d405c56822f6ebacJonathan Brassow	return error;
12691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
12701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1271b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassowstatic void mirror_presuspend(struct dm_target *ti)
12721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
12731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
12741f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
12751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
127604788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio_list holds;
127704788507686d184d8166918b70ef52311bc36dcbMikulas Patocka	struct bio *bio;
127804788507686d184d8166918b70ef52311bc36dcbMikulas Patocka
1279b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 1);
1280b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1281b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
1282f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 * Process bios in the hold list to start recovery waiting
1283f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 * for bios in the hold list. After the process, no bio has
1284f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 * a chance to be added in the hold list because ms->suspend
1285f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 * is set.
1286f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	 */
1287f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	spin_lock_irq(&ms->lock);
1288f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	holds = ms->holds;
1289f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	bio_list_init(&ms->holds);
1290f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	spin_unlock_irq(&ms->lock);
1291f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui
1292f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	while ((bio = bio_list_pop(&holds)))
1293f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui		hold_bio(ms, bio);
1294f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui
1295f070304094edb8d516423e79edd27c97ec2020b0Takahiro Yasui	/*
1296b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * We must finish up all the work that we've
1297b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * generated (i.e. recovery work).
1298b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
12991f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_stop_recovery(ms->rh);
130033184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow
130133184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow	wait_event(_kmirrord_recovery_stopped,
13021f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		   !dm_rh_recovery_in_flight(ms->rh));
130333184048dc4f9d5550d3b6a88c8e0ff92033eb6eJonathan E Brassow
1304b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	if (log->type->presuspend && log->type->presuspend(log))
1305b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		/* FIXME: need better error handling */
1306b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		DMWARN("log presuspend failed");
1307b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1308b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	/*
1309b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * Now that recovery is complete/stopped and the
1310b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * delayed bios are queued, we need to wait for
1311b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * the worker thread to complete.  This way,
1312b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 * we know that all of our I/O has been pushed.
1313b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	 */
1314b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	flush_workqueue(ms->kmirrord_wq);
1315b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow}
1316b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1317b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassowstatic void mirror_postsuspend(struct dm_target *ti)
1318b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow{
1319b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	struct mirror_set *ms = ti->private;
13201f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1321b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
13226b3df0d7a5e85ad2afd3eecc50e2dee59e876ae8Jonathan Brassow	if (log->type->postsuspend && log->type->postsuspend(log))
13231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* FIXME: need better error handling */
1324b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow		DMWARN("log postsuspend failed");
13251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
13261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_resume(struct dm_target *ti)
13281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1329b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	struct mirror_set *ms = ti->private;
13301f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1331b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow
1332b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	atomic_set(&ms->suspend, 0);
13331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	if (log->type->resume && log->type->resume(log))
13341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		/* FIXME: need better error handling */
13351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		DMWARN("log resume failed");
13361f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	dm_rh_start_recovery(ms->rh);
13371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
13381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1339af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow/*
1340af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * device_status_char
1341af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * @m: mirror device/leg we want the status of
1342af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *
1343af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * We return one character representing the most severe error
1344af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * we have encountered.
1345af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    A => Alive - No failures
1346af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    D => Dead - A write failure occurred leaving mirror out-of-sync
1347af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    S => Sync - A sychronization failure occurred, mirror out-of-sync
1348af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *    R => Read - A read failure occurred, mirror data unaffected
1349af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow *
1350af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow * Returns: <char>
1351af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow */
1352af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassowstatic char device_status_char(struct mirror *m)
1353af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow{
1354af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow	if (!atomic_read(&(m->error_count)))
1355af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		return 'A';
1356af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
135764b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka	return (test_bit(DM_RAID1_FLUSH_ERROR, &(m->error_type))) ? 'F' :
135864b30c46e866bbff8a9e17883a18636adc358455Mikulas Patocka		(test_bit(DM_RAID1_WRITE_ERROR, &(m->error_type))) ? 'D' :
1359af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		(test_bit(DM_RAID1_SYNC_ERROR, &(m->error_type))) ? 'S' :
1360af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		(test_bit(DM_RAID1_READ_ERROR, &(m->error_type))) ? 'R' : 'U';
1361af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow}
1362af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
1363af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow
13641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_status(struct dm_target *ti, status_type_t type,
13651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			 char *result, unsigned int maxlen)
13661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
1367315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow	unsigned int m, sz = 0;
13681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	struct mirror_set *ms = (struct mirror_set *) ti->private;
13691f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen	struct dm_dirty_log *log = dm_rh_dirty_log(ms->rh);
1370af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow	char buffer[ms->nr_mirrors + 1];
13711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	switch (type) {
13731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	case STATUSTYPE_INFO:
13741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		DMEMIT("%d ", ms->nr_mirrors);
1375af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		for (m = 0; m < ms->nr_mirrors; m++) {
13761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds			DMEMIT("%s ", ms->mirror[m].dev->name);
1377af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow			buffer[m] = device_status_char(&(ms->mirror[m]));
1378af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		}
1379af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		buffer[m] = '\0';
13801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1381af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		DMEMIT("%llu/%llu 1 %s ",
13821f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		      (unsigned long long)log->type->get_sync_count(log),
1383af195ac82e38ba802fd86b5a014ed05ef6dd88bbJonathan Brassow		      (unsigned long long)ms->nr_regions, buffer);
1384315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
13851f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		sz += log->type->status(log, type, result+sz, maxlen-sz);
1386315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
13871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		break;
13881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
13891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	case STATUSTYPE_TABLE:
13901f965b19437017cea6d3f3f46acdc5acae5fd011Heinz Mauelshagen		sz = log->type->status(log, type, result, maxlen);
1391315dcc226f066c1d3cef79283dcde807fe0e32d1Jonathan E Brassow
1392e52b8f6dbe18c879ad2b5013f991ec9e46813043Jonathan Brassow		DMEMIT("%d", ms->nr_mirrors);
13931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds		for (m = 0; m < ms->nr_mirrors; m++)
1394e52b8f6dbe18c879ad2b5013f991ec9e46813043Jonathan Brassow			DMEMIT(" %s %llu", ms->mirror[m].dev->name,
1395b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow			       (unsigned long long)ms->mirror[m].offset);
1396a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow
1397a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow		if (ms->features & DM_RAID1_HANDLE_ERRORS)
1398a8e6afa2363de7ee0dea1a3297f6236f421c2dd4Jonathan E Brassow			DMEMIT(" 1 handle_errors");
13991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	}
14001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return 0;
14021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
1404af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzerstatic int mirror_iterate_devices(struct dm_target *ti,
1405af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer				  iterate_devices_callout_fn fn, void *data)
1406af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer{
1407af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	struct mirror_set *ms = ti->private;
1408af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	int ret = 0;
1409af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	unsigned i;
1410af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
1411af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	for (i = 0; !ret && i < ms->nr_mirrors; i++)
1412af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer		ret = fn(ti, ms->mirror[i].dev,
14135dea271b6d87bd1d79a59c1d5baac2596a841c37Mike Snitzer			 ms->mirror[i].offset, ti->len, data);
1414af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
1415af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	return ret;
1416af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer}
1417af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer
14181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct target_type mirror_target = {
14191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.name	 = "mirror",
14209c4376de98719d2768dd919553843de34bb094a6Tejun Heo	.version = {1, 12, 1},
14211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.module	 = THIS_MODULE,
14221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.ctr	 = mirror_ctr,
14231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.dtr	 = mirror_dtr,
14241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.map	 = mirror_map,
14251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.end_io	 = mirror_end_io,
1426b80aa7a0c268d3ae0c472f648af1e3e4a359765cJonathan Brassow	.presuspend = mirror_presuspend,
14271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.postsuspend = mirror_postsuspend,
14281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.resume	 = mirror_resume,
14291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	.status	 = mirror_status,
1430af4874e03ed82f050d5872d8c39ce64bf16b5c38Mike Snitzer	.iterate_devices = mirror_iterate_devices,
14311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds};
14321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int __init dm_mirror_init(void)
14341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
14351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	int r;
14361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
143795f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	_dm_raid1_read_record_cache = KMEM_CACHE(dm_raid1_read_record, 0);
143895f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	if (!_dm_raid1_read_record_cache) {
143995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		DMERR("Can't allocate dm_raid1_read_record cache");
144095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		r = -ENOMEM;
144195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		goto bad_cache;
144295f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	}
144395f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
14441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	r = dm_register_target(&mirror_target);
144595f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	if (r < 0) {
14460cd3312434cd1f29bee6bff53bf2790d733ad2a2Alasdair G Kergon		DMERR("Failed to register mirror target");
144795f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka		goto bad_target;
144895f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	}
144995f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka
145095f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	return 0;
14511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
145295f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockabad_target:
145395f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	kmem_cache_destroy(_dm_raid1_read_record_cache);
145495f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patockabad_cache:
14551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds	return r;
14561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void __exit dm_mirror_exit(void)
14591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{
146010d3bd09a3c25df114f74f7f86e1b58d070bef32Mikulas Patocka	dm_unregister_target(&mirror_target);
146195f8fac8dc6139fedfb87746e0c8fda9b803cb46Mikulas Patocka	kmem_cache_destroy(_dm_raid1_read_record_cache);
14621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}
14631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* Module hooks */
14651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_init(dm_mirror_init);
14661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_exit(dm_mirror_exit);
14671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds
14681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_DESCRIPTION(DM_NAME " mirror target");
14691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_AUTHOR("Joe Thornber");
14701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_LICENSE("GPL");
1471