/* dm-raid1.c revision 179e09172ab663b8587ecc46bb18a56a770304a9 */
11da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 21da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Copyright (C) 2003 Sistina Software Limited. 31da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 41da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * This file is released under the GPL. 51da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 61da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 71da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include "dm.h" 81da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include "dm-bio-list.h" 91da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include "dm-io.h" 101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include "dm-log.h" 111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include "kcopyd.h" 121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/ctype.h> 141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/init.h> 151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/mempool.h> 161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/module.h> 171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/pagemap.h> 181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/slab.h> 191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/time.h> 201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/vmalloc.h> 211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#include <linux/workqueue.h> 221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct workqueue_struct *_kmirrord_wq; 241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct work_struct _kmirrord_work; 251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline void wake(void) 
271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds queue_work(_kmirrord_wq, &_kmirrord_work); 291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Region hash 331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * The mirror splits itself up into discrete regions. Each 351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * region can be in one of three states: clean, dirty, 361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * nosync. There is no need to put clean regions in the hash. 371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * In addition to being present in the hash table a region _may_ 391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * be present on one of three lists. 401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * clean_regions: Regions on this list have no io pending to 421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * them, they are in sync, we are no longer interested in them, 431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * they are dull. rh_update_states() will remove them from the 441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * hash table. 451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * quiesced_regions: These regions have been spun down, ready 471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * for recovery. 
rh_recovery_start() will remove regions from 481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * this list and hand them to kmirrord, which will schedule the 491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recovery io with kcopyd. 501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recovered_regions: Regions that kcopyd has successfully 521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recovered. rh_update_states() will now schedule any delayed 531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * io, up the recovery_count, and remove the region from the 541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * hash. 551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * There are 2 locks: 571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * A rw spin lock 'hash_lock' protects just the hash table, 581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * this is never held in write mode from interrupt context, 591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * which I believe means that we only have to disable irqs when 601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * doing a write lock. 611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * An ordinary spin lock 'region_lock' that protects the three 631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * lists in the region_hash, with the 'state', 'list' and 641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 'bhs_delayed' fields of the regions. This is used from irq 651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * context, so all other uses will have to suspend local irqs. 
661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstruct mirror_set; 681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstruct region_hash { 691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms; 701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds uint32_t region_size; 711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned region_shift; 721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* holds persistent region state */ 741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *log; 751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* hash table */ 771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rwlock_t hash_lock; 781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mempool_t *region_pool; 791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int mask; 801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int nr_buckets; 811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head *buckets; 821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spinlock_t region_lock; 841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct semaphore recovery_count; 851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head clean_regions; 861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head quiesced_regions; 871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head recovered_regions; 881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}; 891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsenum { 911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds RH_CLEAN, 
921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds RH_DIRTY, 931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds RH_NOSYNC, 941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds RH_RECOVERING 951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}; 961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstruct region { 981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region_hash *rh; /* FIXME: can we get rid of this ? */ 991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t key; 1001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int state; 1011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head hash_list; 1031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head list; 1041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds atomic_t pending; 1061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio_list delayed_bios; 1071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}; 1081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 1101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Conversion fns 1111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 1121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline region_t bio_to_region(struct region_hash *rh, struct bio *bio) 1131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 1141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return bio->bi_sector >> rh->region_shift; 1151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 1161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline sector_t region_to_sector(struct region_hash *rh, region_t region) 1181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 
1191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return region << rh->region_shift; 1201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 1211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* FIXME move this */ 1231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void queue_bio(struct mirror_set *ms, struct bio *bio, int rw); 1241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#define MIN_REGIONS 64 1261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#define MAX_RECOVERY 1 1271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int rh_init(struct region_hash *rh, struct mirror_set *ms, 1281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *log, uint32_t region_size, 1291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t nr_regions) 1301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 1311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int nr_buckets, max_buckets; 1321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds size_t i; 1331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 1351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Calculate a suitable number of buckets for our hash 1361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * table. 
1371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 1381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds max_buckets = nr_regions >> 6; 1391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (nr_buckets = 128u; nr_buckets < max_buckets; nr_buckets <<= 1) 1401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ; 1411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds nr_buckets >>= 1; 1421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->ms = ms; 1441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->log = log; 1451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->region_size = region_size; 1461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->region_shift = ffs(region_size) - 1; 1471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rwlock_init(&rh->hash_lock); 1481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->mask = nr_buckets - 1; 1491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->nr_buckets = nr_buckets; 1501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->buckets = vmalloc(nr_buckets * sizeof(*rh->buckets)); 1521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!rh->buckets) { 1531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMERR("unable to allocate region hash memory"); 1541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -ENOMEM; 1551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 1561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (i = 0; i < nr_buckets; i++) 1581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(rh->buckets + i); 1591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock_init(&rh->region_lock); 1611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
sema_init(&rh->recovery_count, 0); 1621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(&rh->clean_regions); 1631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(&rh->quiesced_regions); 1641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(&rh->recovered_regions); 1651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1660eaae62abaa1ad1f231932b6cdd9fb1b91df6651Matthew Dobson rh->region_pool = mempool_create_kmalloc_pool(MIN_REGIONS, 1670eaae62abaa1ad1f231932b6cdd9fb1b91df6651Matthew Dobson sizeof(struct region)); 1681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!rh->region_pool) { 1691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds vfree(rh->buckets); 1701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->buckets = NULL; 1711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -ENOMEM; 1721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 1731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 1751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 1761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_exit(struct region_hash *rh) 1781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 1791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int h; 1801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg, *nreg; 1811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds BUG_ON(!list_empty(&rh->quiesced_regions)); 1831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (h = 0; h < rh->nr_buckets; h++) { 1841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry_safe(reg, nreg, rh->buckets + h, hash_list) { 1851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds BUG_ON(atomic_read(®->pending)); 
1861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mempool_free(reg, rh->region_pool); 1871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 1881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 1891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (rh->log) 1911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_destroy_dirty_log(rh->log); 1921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (rh->region_pool) 1931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mempool_destroy(rh->region_pool); 1941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds vfree(rh->buckets); 1951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 1961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#define RH_HASH_MULT 2654435387U 1981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 1991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline unsigned int rh_hash(struct region_hash *rh, region_t region) 2001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return (unsigned int) ((region * RH_HASH_MULT) >> 12) & rh->mask; 2021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 2031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct region *__rh_lookup(struct region_hash *rh, region_t region) 2051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 2071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry (reg, rh->buckets + rh_hash(rh, region), hash_list) 2091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (reg->key == region) 2101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return reg; 
2111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 2131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 2141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void __rh_insert(struct region_hash *rh, struct region *reg) 2161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int h = rh_hash(rh, reg->key); 2181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_add(®->hash_list, rh->buckets + h); 2191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 2201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct region *__rh_alloc(struct region_hash *rh, region_t region) 2221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg, *nreg; 2241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_unlock(&rh->hash_lock); 2261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds nreg = mempool_alloc(rh->region_pool, GFP_NOIO); 2271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds nreg->state = rh->log->type->in_sync(rh->log, region, 1) ? 
2281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds RH_CLEAN : RH_NOSYNC; 2291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds nreg->rh = rh; 2301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds nreg->key = region; 2311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(&nreg->list); 2331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds atomic_set(&nreg->pending, 0); 2351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_init(&nreg->delayed_bios); 2361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds write_lock_irq(&rh->hash_lock); 2371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_lookup(rh, region); 2391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (reg) 2401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* we lost the race */ 2411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mempool_free(nreg, rh->region_pool); 2421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds else { 2441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds __rh_insert(rh, nreg); 2451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (nreg->state == RH_CLEAN) { 2461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock(&rh->region_lock); 2471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_add(&nreg->list, &rh->clean_regions); 2481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock(&rh->region_lock); 2491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 2501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = nreg; 2511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 2521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds write_unlock_irq(&rh->hash_lock); 2531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
read_lock(&rh->hash_lock); 2541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return reg; 2561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 2571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline struct region *__rh_find(struct region_hash *rh, region_t region) 2591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 2611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_lookup(rh, region); 2631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!reg) 2641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_alloc(rh, region); 2651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return reg; 2671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 2681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int rh_state(struct region_hash *rh, region_t region, int may_block) 2701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 2721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 2731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_lock(&rh->hash_lock); 2751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_lookup(rh, region); 2761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_unlock(&rh->hash_lock); 2771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (reg) 2791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return reg->state; 2801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
2811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 2821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * The region wasn't in the hash, so we fall back to the 2831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * dirty log. 2841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 2851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = rh->log->type->in_sync(rh->log, region, may_block); 2861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 2881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Any error from the dirty log (eg. -EWOULDBLOCK) gets 2891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * taken as a RH_NOSYNC 2901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 2911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r == 1 ? RH_CLEAN : RH_NOSYNC; 2921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 2931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 2941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline int rh_in_sync(struct region_hash *rh, 2951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t region, int may_block) 2961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 2971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int state = rh_state(rh, region, may_block); 2981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return state == RH_CLEAN || state == RH_DIRTY; 2991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 3001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void dispatch_bios(struct mirror_set *ms, struct bio_list *bio_list) 3021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 3031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio *bio; 3041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((bio = bio_list_pop(bio_list))) { 
3061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds queue_bio(ms, bio, WRITE); 3071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 3081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 3091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_update_states(struct region_hash *rh) 3111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 3121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg, *next; 3131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds LIST_HEAD(clean); 3151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds LIST_HEAD(recovered); 3161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 3181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Quickly grab the lists. 3191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 3201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds write_lock_irq(&rh->hash_lock); 3211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock(&rh->region_lock); 3221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!list_empty(&rh->clean_regions)) { 3231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_splice(&rh->clean_regions, &clean); 3241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(&rh->clean_regions); 3251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry (reg, &clean, list) { 3271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->log->type->clear_region(rh->log, reg->key); 3281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_del(®->hash_list); 3291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 3301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 3311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
3321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!list_empty(&rh->recovered_regions)) { 3331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_splice(&rh->recovered_regions, &recovered); 3341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_LIST_HEAD(&rh->recovered_regions); 3351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry (reg, &recovered, list) 3371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_del(®->hash_list); 3381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 3391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock(&rh->region_lock); 3401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds write_unlock_irq(&rh->hash_lock); 3411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 3431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * All the regions on the recovered and clean lists have 3441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * now been pulled out of the system, so no need to do 3451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * any more locking. 
3461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 3471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry_safe (reg, next, &recovered, list) { 3481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->log->type->clear_region(rh->log, reg->key); 3491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->log->type->complete_resync_work(rh->log, reg->key, 1); 3501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dispatch_bios(rh->ms, ®->delayed_bios); 3511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds up(&rh->recovery_count); 3521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mempool_free(reg, rh->region_pool); 3531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 3541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!list_empty(&recovered)) 3561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->log->type->flush(rh->log); 3571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry_safe (reg, next, &clean, list) 3591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mempool_free(reg, rh->region_pool); 3601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 3611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_inc(struct region_hash *rh, region_t region) 3631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 3641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 3651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_lock(&rh->hash_lock); 3671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_find(rh, region); 368844e8d904a7c1446e3f040683b4a0645c3eb168fJun'ichi Nomura 3697692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow spin_lock_irq(&rh->region_lock); 
370844e8d904a7c1446e3f040683b4a0645c3eb168fJun'ichi Nomura atomic_inc(®->pending); 371844e8d904a7c1446e3f040683b4a0645c3eb168fJun'ichi Nomura 3721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (reg->state == RH_CLEAN) { 3731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg->state = RH_DIRTY; 3741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_del_init(®->list); /* take off the clean list */ 3757692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow spin_unlock_irq(&rh->region_lock); 3767692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow 3777692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow rh->log->type->mark_region(rh->log, reg->key); 3787692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow } else 3797692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow spin_unlock_irq(&rh->region_lock); 3807692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow 3811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_unlock(&rh->hash_lock); 3831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 3841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_inc_pending(struct region_hash *rh, struct bio_list *bios) 3861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 3871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio *bio; 3881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (bio = bios->head; bio; bio = bio->bi_next) 3901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_inc(rh, bio_to_region(rh, bio)); 3911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 3921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_dec(struct region_hash *rh, region_t region) 3941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 
3951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned long flags; 3961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 3971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int should_wake = 0; 3981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 3991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_lock(&rh->hash_lock); 4001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_lookup(rh, region); 4011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_unlock(&rh->hash_lock); 4021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4037692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow spin_lock_irqsave(&rh->region_lock, flags); 4041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (atomic_dec_and_test(®->pending)) { 405930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura /* 406930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * There is no pending I/O for this region. 407930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * We can move the region to corresponding list for next action. 408930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * At this point, the region is not yet connected to any list. 409930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * 410930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * If the state is RH_NOSYNC, the region should be kept off 411930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * from clean list. 412930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * The hash entry for RH_NOSYNC will remain in memory 413930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura * until the region is recovered or the map is reloaded. 
414930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura */ 415930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura 416930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura /* do nothing for RH_NOSYNC */ 4171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (reg->state == RH_RECOVERING) { 4181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_add_tail(®->list, &rh->quiesced_regions); 419930d332a23682202c07df0276dd665a57755b37dJun'ichi Nomura } else if (reg->state == RH_DIRTY) { 4201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg->state = RH_CLEAN; 4211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_add(®->list, &rh->clean_regions); 4221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 4231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds should_wake = 1; 4241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 4257692c5dd48026d952199c2b97c3418f927cc0407Jonathan E Brassow spin_unlock_irqrestore(&rh->region_lock, flags); 4261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (should_wake) 4281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds wake(); 4291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 4301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 4321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Starts quiescing a region in preparation for recovery. 
4331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 4341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int __rh_recovery_prepare(struct region_hash *rh) 4351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 4361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 4371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 4381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t region; 4391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 4411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Ask the dirty log what's next. 4421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 4431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = rh->log->type->get_resync_work(rh->log, ®ion); 4441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r <= 0) 4451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 4461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 4481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Get this region, and start it quiescing by setting the 4491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recovering flag. 4501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 4511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_lock(&rh->hash_lock); 4521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_find(rh, region); 4531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_unlock(&rh->hash_lock); 4541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock_irq(&rh->region_lock); 4561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg->state = RH_RECOVERING; 4571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* Already quiesced ? 
*/ 4591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (atomic_read(®->pending)) 4601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_del_init(®->list); 461179e09172ab663b8587ecc46bb18a56a770304a9Akinobu Mita else 462179e09172ab663b8587ecc46bb18a56a770304a9Akinobu Mita list_move(®->list, &rh->quiesced_regions); 4631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock_irq(&rh->region_lock); 4651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 1; 4671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 4681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_recovery_prepare(struct region_hash *rh) 4701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 4711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while (!down_trylock(&rh->recovery_count)) 4721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (__rh_recovery_prepare(rh) <= 0) { 4731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds up(&rh->recovery_count); 4741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds break; 4751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 4761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 4771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 4791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Returns any quiesced regions. 
4801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 4811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct region *rh_recovery_start(struct region_hash *rh) 4821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 4831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg = NULL; 4841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock_irq(&rh->region_lock); 4861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!list_empty(&rh->quiesced_regions)) { 4871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = list_entry(rh->quiesced_regions.next, 4881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region, list); 4891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_del_init(®->list); /* remove from the quiesced list */ 4901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 4911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock_irq(&rh->region_lock); 4921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return reg; 4941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 4951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 4961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* FIXME: success ignored for now */ 4971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_recovery_end(struct region *reg, int success) 4981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 4991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region_hash *rh = reg->rh; 5001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock_irq(&rh->region_lock); 5021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_add(®->list, ®->rh->recovered_regions); 5031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock_irq(&rh->region_lock); 
5041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds wake(); 5061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 5071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_flush(struct region_hash *rh) 5091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 5101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh->log->type->flush(rh->log); 5111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 5121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_delay(struct region_hash *rh, struct bio *bio) 5141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 5151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 5161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_lock(&rh->hash_lock); 5181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reg = __rh_find(rh, bio_to_region(rh, bio)); 5191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_add(®->delayed_bios, bio); 5201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds read_unlock(&rh->hash_lock); 5211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 5221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_stop_recovery(struct region_hash *rh) 5241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 5251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int i; 5261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* wait for any recovering regions */ 5281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (i = 0; i < MAX_RECOVERY; i++) 5291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds down(&rh->recovery_count); 5301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus 
Torvalds} 5311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void rh_start_recovery(struct region_hash *rh) 5331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 5341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int i; 5351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (i = 0; i < MAX_RECOVERY; i++) 5371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds up(&rh->recovery_count); 5381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds wake(); 5401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 5411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 5431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Mirror set structures. 5441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 5451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstruct mirror { 5461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds atomic_t error_count; 5471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dm_dev *dev; 5481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds sector_t offset; 5491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}; 5501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstruct mirror_set { 5521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dm_target *ti; 5531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct list_head list; 5541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region_hash rh; 5551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct kcopyd_client *kcopyd_client; 5561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
5571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spinlock_t lock; /* protects the next two lists */ 5581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio_list reads; 5591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio_list writes; 5601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* recovery */ 5621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t nr_regions; 5631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int in_sync; 5641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 565a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow struct mirror *default_mirror; /* Default mirror */ 566a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow 5671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int nr_mirrors; 5681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror mirror[0]; 5691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}; 5701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 5721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Every mirror should look like this one. 5731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 5741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#define DEFAULT_MIRROR 0 5751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 5771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * This is yucky. We squirrel the mirror_set struct away inside 5781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * bi_next for write buffers. This is safe since the bh 5791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * doesn't get submitted to the lower levels of block layer. 
5801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 5811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror_set *bio_get_ms(struct bio *bio) 5821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 5831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return (struct mirror_set *) bio->bi_next; 5841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 5851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void bio_set_ms(struct bio *bio, struct mirror_set *ms) 5871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 5881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio->bi_next = (struct bio *) ms; 5891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 5901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 5911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 5921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Recovery. 5931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 5941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * When a mirror is first activated we may find that some regions 5951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * are in the no-sync state. We have to recover these by 5961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * recopying from the default mirror to all the others. 
5971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 5981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void recovery_complete(int read_err, unsigned int write_err, 5991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds void *context) 6001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 6011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg = (struct region *) context; 6021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* FIXME: better error handling */ 6041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_recovery_end(reg, read_err || write_err); 6051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 6061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int recover(struct mirror_set *ms, struct region *reg) 6081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 6091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 6101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int i; 6111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct io_region from, to[KCOPYD_MAX_REGIONS], *dest; 6121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror *m; 6131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned long flags = 0; 6141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* fill in the source */ 616a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow m = ms->default_mirror; 6171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds from.bdev = m->dev->bdev; 6181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds from.sector = m->offset + region_to_sector(reg->rh, reg->key); 6191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (reg->key == (ms->nr_regions - 1)) { 
6201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 6211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * The final region may be smaller than 6221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * region_size. 6231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 6241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds from.count = ms->ti->len & (reg->rh->region_size - 1); 6251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!from.count) 6261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds from.count = reg->rh->region_size; 6271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } else 6281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds from.count = reg->rh->region_size; 6291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* fill in the destinations */ 6311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (i = 0, dest = to; i < ms->nr_mirrors; i++) { 632a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow if (&ms->mirror[i] == ms->default_mirror) 6331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds continue; 6341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds m = ms->mirror + i; 6361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dest->bdev = m->dev->bdev; 6371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dest->sector = m->offset + region_to_sector(reg->rh, reg->key); 6381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dest->count = from.count; 6391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dest++; 6401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 6411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* hand to kcopyd */ 6431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds set_bit(KCOPYD_IGNORE_ERROR, &flags); 6441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = 
kcopyd_copy(ms->kcopyd_client, &from, ms->nr_mirrors - 1, to, flags, 6451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds recovery_complete, reg); 6461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 6481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 6491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_recovery(struct mirror_set *ms) 6511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 6521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 6531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct region *reg; 6541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *log = ms->rh.log; 6551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 6571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Start quiescing some regions. 6581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 6591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_recovery_prepare(&ms->rh); 6601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 6621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Copy any already quiesced regions. 6631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 6641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((reg = rh_recovery_start(&ms->rh))) { 6651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = recover(ms, reg); 6661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r) 6671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_recovery_end(reg, 0); 6681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 6691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 6711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Update the in sync flag. 
6721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 6731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!ms->in_sync && 6741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds (log->type->get_sync_count(log) == ms->nr_regions)) { 6751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* the sync is complete */ 6761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_table_event(ms->ti->table); 6771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms->in_sync = 1; 6781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 6791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 6801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 6821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Reads 6831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 6841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror *choose_mirror(struct mirror_set *ms, sector_t sector) 6851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 6861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* FIXME: add read balancing */ 687a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow return ms->default_mirror; 6881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 6891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 6911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * remap a buffer to a particular mirror. 
6921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 6931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void map_bio(struct mirror_set *ms, struct mirror *m, struct bio *bio) 6941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 6951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio->bi_bdev = m->dev->bdev; 6961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio->bi_sector = m->offset + (bio->bi_sector - ms->ti->begin); 6971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 6981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 6991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_reads(struct mirror_set *ms, struct bio_list *reads) 7001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 7011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t region; 7021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio *bio; 7031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror *m; 7041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((bio = bio_list_pop(reads))) { 7061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region = bio_to_region(&ms->rh, bio); 7071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 7091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * We can only read balance if the region is in sync. 
7101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 7111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (rh_in_sync(&ms->rh, region, 0)) 7121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds m = choose_mirror(ms, bio->bi_sector); 7131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds else 714a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow m = ms->default_mirror; 7151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds map_bio(ms, m, bio); 7171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds generic_make_request(bio); 7181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 7191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 7201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 7221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Writes. 7231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 7241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * We do different things with the write io depending on the 7251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * state of the region that it's in: 7261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 7271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * SYNC: increment pending, use kcopyd to write to *all* mirrors 7281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * RECOVERING: delay the io until recovery completes 7291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * NOSYNC: increment pending, just write to the default mirror 7301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 7311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void write_callback(unsigned long error, void *context) 7321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 
7331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int i; 7341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int uptodate = 1; 7351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio *bio = (struct bio *) context; 7361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms; 7371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms = bio_get_ms(bio); 7391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_set_ms(bio, NULL); 7401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 7421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * NOTE: We don't decrement the pending count here, 7431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * instead it is done by the targets endio function. 7441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * This way we handle both writes to SYNC and NOSYNC 7451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * regions with the same code. 7461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 7471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (error) { 7491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 7501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * only error the io if all mirrors failed. 
7511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * FIXME: bogus 7521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 7531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds uptodate = 0; 7541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (i = 0; i < ms->nr_mirrors; i++) 7551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!test_bit(i, &error)) { 7561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds uptodate = 1; 7571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds break; 7581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 7591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 7601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_endio(bio, bio->bi_size, 0); 7611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 7621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_write(struct mirror_set *ms, struct bio *bio) 7641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 7651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int i; 7661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct io_region io[KCOPYD_MAX_REGIONS+1]; 7671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror *m; 7681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (i = 0; i < ms->nr_mirrors; i++) { 7701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds m = ms->mirror + i; 7711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds io[i].bdev = m->dev->bdev; 7731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds io[i].sector = m->offset + (bio->bi_sector - ms->ti->begin); 7741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds io[i].count = bio->bi_size >> 9; 7751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 7761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
7771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_set_ms(bio, ms); 7781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_io_async_bvec(ms->nr_mirrors, io, WRITE, 7791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio->bi_io_vec + bio->bi_idx, 7801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds write_callback, bio); 7811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 7821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_writes(struct mirror_set *ms, struct bio_list *writes) 7841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 7851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int state; 7861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio *bio; 7871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio_list sync, nosync, recover, *this_list = NULL; 7881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!writes->head) 7901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return; 7911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 7931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Classify each write. 
7941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 7951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_init(&sync); 7961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_init(&nosync); 7971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_init(&recover); 7981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 7991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((bio = bio_list_pop(writes))) { 8001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds state = rh_state(&ms->rh, bio_to_region(&ms->rh, bio), 1); 8011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds switch (state) { 8021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds case RH_CLEAN: 8031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds case RH_DIRTY: 8041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds this_list = &sync; 8051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds break; 8061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds case RH_NOSYNC: 8081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds this_list = &nosync; 8091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds break; 8101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds case RH_RECOVERING: 8121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds this_list = &recover; 8131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds break; 8141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 8151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_add(this_list, bio); 8171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 8181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 8201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Increment the pending counts for any regions that will 
8211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * be written to (writes to recover regions are going to 8221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * be delayed). 8231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 8241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_inc_pending(&ms->rh, &sync); 8251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_inc_pending(&ms->rh, &nosync); 8261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_flush(&ms->rh); 8271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 8291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Dispatch io. 8301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 8311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((bio = bio_list_pop(&sync))) 8321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds do_write(ms, bio); 8331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((bio = bio_list_pop(&recover))) 8351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_delay(&ms->rh, bio); 8361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while ((bio = bio_list_pop(&nosync))) { 838a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow map_bio(ms, ms->default_mirror, bio); 8391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds generic_make_request(bio); 8401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 8411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 8421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 8441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * kmirrord 8451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 
8461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic LIST_HEAD(_mirror_sets); 8471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic DECLARE_RWSEM(_mirror_sets_lock); 8481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_mirror(struct mirror_set *ms) 8501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 8511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio_list reads, writes; 8521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock(&ms->lock); 8541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds reads = ms->reads; 8551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds writes = ms->writes; 8561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_init(&ms->reads); 8571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_init(&ms->writes); 8581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock(&ms->lock); 8591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_update_states(&ms->rh); 8611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds do_recovery(ms); 8621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds do_reads(ms, &reads); 8631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds do_writes(ms, &writes); 8641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 8651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void do_work(void *ignored) 8671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 8681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms; 8691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds down_read(&_mirror_sets_lock); 8711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_for_each_entry (ms, &_mirror_sets, list) 
8721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds do_mirror(ms); 8731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds up_read(&_mirror_sets_lock); 8741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 8751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/*----------------------------------------------------------------- 8771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Target functions 8781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *---------------------------------------------------------------*/ 8791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct mirror_set *alloc_context(unsigned int nr_mirrors, 8801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds uint32_t region_size, 8811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dm_target *ti, 8821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *dl) 8831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 8841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds size_t len; 8851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = NULL; 8861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (array_too_big(sizeof(*ms), sizeof(ms->mirror[0]), nr_mirrors)) 8881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 8891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds len = sizeof(*ms) + (sizeof(ms->mirror[0]) * nr_mirrors); 8911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms = kmalloc(len, GFP_KERNEL); 8931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!ms) { 8941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Cannot allocate mirror context"; 8951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 
8961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 8971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 8981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds memset(ms, 0, len); 8991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock_init(&ms->lock); 9001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms->ti = ti; 9021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms->nr_mirrors = nr_mirrors; 9031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms->nr_regions = dm_sector_div_up(ti->len, region_size); 9041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms->in_sync = 0; 905a1a190807074bd6ad8771e00b00752771ae586cbJonathan E Brassow ms->default_mirror = &ms->mirror[DEFAULT_MIRROR]; 9061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (rh_init(&ms->rh, ms, dl, region_size, ms->nr_regions)) { 9081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Error creating dirty region hash"; 9091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds kfree(ms); 9101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 9111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 9121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return ms; 9141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 9151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void free_context(struct mirror_set *ms, struct dm_target *ti, 9171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int m) 9181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 9191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds while (m--) 9201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_put_device(ti, ms->mirror[m].dev); 9211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
9221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_exit(&ms->rh); 9231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds kfree(ms); 9241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 9251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic inline int _check_region_size(struct dm_target *ti, uint32_t size) 9271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 9281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return !(size % (PAGE_SIZE >> 9) || (size & (size - 1)) || 9291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds size > ti->len); 9301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 9311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int get_mirror(struct mirror_set *ms, struct dm_target *ti, 9331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int mirror, char **argv) 9341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 9354ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton unsigned long long offset; 9361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9374ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton if (sscanf(argv[1], "%llu", &offset) != 1) { 9381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Invalid offset"; 9391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -EINVAL; 9401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 9411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (dm_get_device(ti, argv[0], offset, ti->len, 9431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_table_get_mode(ti->table), 9441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds &ms->mirror[mirror].dev)) { 9451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Device lookup failure"; 9461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 
-ENXIO; 9471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 9481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms->mirror[mirror].offset = offset; 9501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 9521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 9531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int add_mirror_set(struct mirror_set *ms) 9551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 9561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds down_write(&_mirror_sets_lock); 9571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_add_tail(&ms->list, &_mirror_sets); 9581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds up_write(&_mirror_sets_lock); 9591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds wake(); 9601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 9621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 9631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void del_mirror_set(struct mirror_set *ms) 9651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 9661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds down_write(&_mirror_sets_lock); 9671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds list_del(&ms->list); 9681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds up_write(&_mirror_sets_lock); 9691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 9701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 9721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Create dirty log: log_type #log_params <log_params> 9731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 
9741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct dirty_log *create_dirty_log(struct dm_target *ti, 9751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int argc, char **argv, 9761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int *args_used) 9771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 9781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int param_count; 9791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *dl; 9801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (argc < 2) { 9821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Insufficient mirror log arguments"; 9831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 9841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 9851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (sscanf(argv[1], "%u", ¶m_count) != 1) { 9871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Invalid mirror log argument count"; 9881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 9891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 9901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds *args_used = 2 + param_count; 9921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (argc < *args_used) { 9941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Insufficient mirror log arguments"; 9951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 9961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 9971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 9981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dl = dm_create_dirty_log(argv[0], ti, param_count, argv + 2); 
9991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!dl) { 10001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Error creating mirror dirty log"; 10011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 10021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!_check_region_size(ti, dl->type->get_region_size(dl))) { 10051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Invalid region size"; 10061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_destroy_dirty_log(dl); 10071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return NULL; 10081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return dl; 10111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 10121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 10141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Construct a mirror mapping: 10151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 10161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type #log_params <log_params> 10171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #mirrors [mirror_path offset]{2,} 10181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * 10191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * log_type is "core" or "disk" 10201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * #log_params is between 1 and 3 10211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 10221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds#define DM_IO_PAGES 64 10231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_ctr(struct dm_target *ti, unsigned int argc, char **argv) 
10241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 10251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 10261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int nr_mirrors, m, args_used; 10271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms; 10281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *dl; 10291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dl = create_dirty_log(ti, argc, argv, &args_used); 10311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!dl) 10321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -EINVAL; 10331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds argv += args_used; 10351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds argc -= args_used; 10361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!argc || sscanf(argv[0], "%u", &nr_mirrors) != 1 || 10381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds nr_mirrors < 2 || nr_mirrors > KCOPYD_MAX_REGIONS + 1) { 10391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Invalid number of mirrors"; 10401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_destroy_dirty_log(dl); 10411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -EINVAL; 10421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds argv++, argc--; 10451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (argc != nr_mirrors * 2) { 10471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->error = "dm-mirror: Wrong number of mirror arguments"; 10481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_destroy_dirty_log(dl); 
10491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -EINVAL; 10501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ms = alloc_context(nr_mirrors, dl->type->get_region_size(dl), ti, dl); 10531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!ms) { 10541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_destroy_dirty_log(dl); 10551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -ENOMEM; 10561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* Get the mirror parameter sets */ 10591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (m = 0; m < nr_mirrors; m++) { 10601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = get_mirror(ms, ti, m, argv); 10611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r) { 10621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds free_context(ms, ti, m); 10631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 10641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds argv += 2; 10661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds argc -= 2; 10671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds ti->private = ms; 1070d88854f08961d26f3a63cfae7972188d26a128e4Alasdair G Kergon ti->split_io = ms->rh.region_size; 10711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = kcopyd_client_create(DM_IO_PAGES, &ms->kcopyd_client); 10731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r) { 10741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds free_context(ms, ti, ms->nr_mirrors); 
10751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 10761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 10771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds add_mirror_set(ms); 10791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 10801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 10811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_dtr(struct dm_target *ti) 10831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 10841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = (struct mirror_set *) ti->private; 10851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds del_mirror_set(ms); 10871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds kcopyd_client_destroy(ms->kcopyd_client); 10881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds free_context(ms, ti, ms->nr_mirrors); 10891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 10901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void queue_bio(struct mirror_set *ms, struct bio *bio, int rw) 10921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 10931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int should_wake = 0; 10941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct bio_list *bl; 10951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 10961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bl = (rw == WRITE) ? 
&ms->writes : &ms->reads; 10971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_lock(&ms->lock); 10981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds should_wake = !(bl->head); 10991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_list_add(bl, bio); 11001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds spin_unlock(&ms->lock); 11011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (should_wake) 11031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds wake(); 11041da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 11051da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11061da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* 11071da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * Mirror mapping function 11081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 11091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_map(struct dm_target *ti, struct bio *bio, 11101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds union map_info *map_context) 11111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 11121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r, rw = bio_rw(bio); 11131da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror *m; 11141da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = ti->private; 11151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds map_context->ll = bio->bi_sector >> ms->rh.region_shift; 11171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (rw == WRITE) { 11191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds queue_bio(ms, bio, rw); 11201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 11211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 11221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
11231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = ms->rh.log->type->in_sync(ms->rh.log, 11241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds bio_to_region(&ms->rh, bio), 0); 11251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r < 0 && r != -EWOULDBLOCK) 11261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 11271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r == -EWOULDBLOCK) /* FIXME: ugly */ 11291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = 0; 11301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 11321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * We don't want to fast track a recovery just for a read 11331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * ahead. So we just let it silently fail. 11341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * FIXME: get rid of this. 11351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 11361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!r && rw == READA) 11371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -EIO; 11381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!r) { 11401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* Pass this io over to the daemon */ 11411da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds queue_bio(ms, bio, rw); 11421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 11431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 11441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds m = choose_mirror(ms, bio->bi_sector); 11461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!m) 11471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return -EIO; 11481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
11491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds map_bio(ms, m, bio); 11501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 1; 11511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 11521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_end_io(struct dm_target *ti, struct bio *bio, 11541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int error, union map_info *map_context) 11551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 11561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int rw = bio_rw(bio); 11571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = (struct mirror_set *) ti->private; 11581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds region_t region = map_context->ll; 11591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* 11611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds * We need to dec pending if this was a write. 
11621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds */ 11631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (rw == WRITE) 11641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_dec(&ms->rh, region); 11651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 11671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 11681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_postsuspend(struct dm_target *ti) 11701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 11711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = (struct mirror_set *) ti->private; 11721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *log = ms->rh.log; 11731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_stop_recovery(&ms->rh); 11751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (log->type->suspend && log->type->suspend(log)) 11761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* FIXME: need better error handling */ 11771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMWARN("log suspend failed"); 11781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 11791da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11801da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void mirror_resume(struct dm_target *ti) 11811da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 11821da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = (struct mirror_set *) ti->private; 11831da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct dirty_log *log = ms->rh.log; 11841da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (log->type->resume && log->type->resume(log)) 11851da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds /* FIXME: need better error handling */ 
11861da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMWARN("log resume failed"); 11871da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds rh_start_recovery(&ms->rh); 11881da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 11891da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11901da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int mirror_status(struct dm_target *ti, status_type_t type, 11911da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds char *result, unsigned int maxlen) 11921da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 11931da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds unsigned int m, sz; 11941da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds struct mirror_set *ms = (struct mirror_set *) ti->private; 11951da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11961da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds sz = ms->rh.log->type->status(ms->rh.log, type, result, maxlen); 11971da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 11981da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds switch (type) { 11991da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds case STATUSTYPE_INFO: 12001da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMEMIT("%d ", ms->nr_mirrors); 12011da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (m = 0; m < ms->nr_mirrors; m++) 12021da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMEMIT("%s ", ms->mirror[m].dev->name); 12031da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12044ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton DMEMIT("%llu/%llu", 12054ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton (unsigned long long)ms->rh.log->type-> 12064ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton get_sync_count(ms->rh.log), 12074ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton (unsigned long long)ms->nr_regions); 12081da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds break; 12091da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 
12101da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds case STATUSTYPE_TABLE: 12111da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMEMIT("%d ", ms->nr_mirrors); 12121da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds for (m = 0; m < ms->nr_mirrors; m++) 12134ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton DMEMIT("%s %llu ", ms->mirror[m].dev->name, 12144ee218cd67b385759993a6c840ea45f0ee0a8b30Andrew Morton (unsigned long long)ms->mirror[m].offset); 12151da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 12161da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12171da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return 0; 12181da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 12191da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12201da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic struct target_type mirror_target = { 12211da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .name = "mirror", 12221da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .version = {1, 0, 1}, 12231da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .module = THIS_MODULE, 12241da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .ctr = mirror_ctr, 12251da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .dtr = mirror_dtr, 12261da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .map = mirror_map, 12271da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .end_io = mirror_end_io, 12281da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .postsuspend = mirror_postsuspend, 12291da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .resume = mirror_resume, 12301da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds .status = mirror_status, 12311da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds}; 12321da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12331da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic int __init dm_mirror_init(void) 12341da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 
12351da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 12361da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12371da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = dm_dirty_log_init(); 12381da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r) 12391da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 12401da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 124148f1f5328267f52a34e61b8b0e6fc55a23c1348aAlasdair G Kergon _kmirrord_wq = create_singlethread_workqueue("kmirrord"); 12421da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (!_kmirrord_wq) { 12431da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMERR("couldn't start kmirrord"); 12441da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_dirty_log_exit(); 12451da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 12461da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 12471da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds INIT_WORK(&_kmirrord_work, do_work, NULL); 12481da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12491da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = dm_register_target(&mirror_target); 12501da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r < 0) { 12511da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMERR("%s: Failed to register mirror target", 12521da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds mirror_target.name); 12531da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_dirty_log_exit(); 12541da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds destroy_workqueue(_kmirrord_wq); 12551da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds } 12561da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12571da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds return r; 12581da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 12591da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12601da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsstatic void __exit dm_mirror_exit(void) 
12611da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds{ 12621da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds int r; 12631da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12641da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds r = dm_unregister_target(&mirror_target); 12651da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds if (r < 0) 12661da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds DMERR("%s: unregister failed %d", mirror_target.name, r); 12671da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12681da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds destroy_workqueue(_kmirrord_wq); 12691da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds dm_dirty_log_exit(); 12701da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds} 12711da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12721da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds/* Module hooks */ 12731da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_init(dm_mirror_init); 12741da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvaldsmodule_exit(dm_mirror_exit); 12751da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus Torvalds 12761da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_DESCRIPTION(DM_NAME " mirror target"); 12771da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_AUTHOR("Joe Thornber"); 12781da177e4c3f41524e886b7f1b8a0c1fc7321cacLinus TorvaldsMODULE_LICENSE("GPL"); 1279