diff options
author | Linus Torvalds <torvalds@linux-foundation.org> | 2009-04-03 12:08:19 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2009-04-03 12:08:19 -0400 |
commit | 223cdea4c4b5af5181b2da00ac85711d1e0c737c (patch) | |
tree | dfe7226c70ddabbf2e2e63924ba636345278e79c /drivers/md/raid1.h | |
parent | 31e6e2dac575c9d21a6ec56ca52ae89086baa705 (diff) | |
parent | c8f517c444e4f9f55b5b5ca202b8404691a35805 (diff) |
Merge branch 'for-linus' of git://neil.brown.name/md
* 'for-linus' of git://neil.brown.name/md: (53 commits)
md/raid5 revise rules for when to update metadata during reshape
md/raid5: minor code cleanups in make_request.
md: remove CONFIG_MD_RAID_RESHAPE config option.
md/raid5: be more careful about write ordering when reshaping.
md: don't display meaningless values in sysfs files resync_start and sync_speed
md/raid5: allow layout and chunksize to be changed on active array.
md/raid5: reshape using largest of old and new chunk size
md/raid5: prepare for allowing reshape to change layout
md/raid5: prepare for allowing reshape to change chunksize.
md/raid5: clearly differentiate 'before' and 'after' stripes during reshape.
Documentation/md.txt update
md: allow number of drives in raid5 to be reduced
md/raid5: change reshape-progress measurement to cope with reshaping backwards.
md: add explicit method to signal the end of a reshape.
md/raid5: enhance raid5_size to work correctly with negative delta_disks
md/raid5: drop qd_idx from r6_state
md/raid6: move raid6 data processing to raid6_pq.ko
md: raid5 run(): Fix max_degraded for raid level 4.
md: 'array_size' sysfs attribute
md: centralize ->array_sectors modifications
...
Diffstat (limited to 'drivers/md/raid1.h')
-rw-r--r-- | drivers/md/raid1.h | 132 |
1 files changed, 132 insertions, 0 deletions
diff --git a/drivers/md/raid1.h b/drivers/md/raid1.h
new file mode 100644
index 000000000000..1620eea3d57c
--- /dev/null
+++ b/drivers/md/raid1.h
@@ -0,0 +1,132 @@ | |||
1 | #ifndef _RAID1_H | ||
2 | #define _RAID1_H | ||
3 | |||
4 | typedef struct mirror_info mirror_info_t; | ||
5 | |||
6 | struct mirror_info { | ||
7 | mdk_rdev_t *rdev; | ||
8 | sector_t head_position; | ||
9 | }; | ||
10 | |||
11 | /* | ||
12 | * memory pools need a pointer to the mddev, so they can force an unplug | ||
13 | * when memory is tight, and a count of the number of drives that the | ||
14 | * pool was allocated for, so they know how much to allocate and free. | ||
15 | * mddev->raid_disks cannot be used, as it can change while a pool is active | ||
16 | * These two datums are stored in a kmalloced struct. | ||
17 | */ | ||
18 | |||
19 | struct pool_info { | ||
20 | mddev_t *mddev; | ||
21 | int raid_disks; | ||
22 | }; | ||
23 | |||
24 | |||
25 | typedef struct r1bio_s r1bio_t; | ||
26 | |||
27 | struct r1_private_data_s { | ||
28 | mddev_t *mddev; | ||
29 | mirror_info_t *mirrors; | ||
30 | int raid_disks; | ||
31 | int last_used; | ||
32 | sector_t next_seq_sect; | ||
33 | spinlock_t device_lock; | ||
34 | |||
35 | struct list_head retry_list; | ||
36 | /* queue pending writes and submit them on unplug */ | ||
37 | struct bio_list pending_bio_list; | ||
38 | /* queue of writes that have been unplugged */ | ||
39 | struct bio_list flushing_bio_list; | ||
40 | |||
41 | /* for use when syncing mirrors: */ | ||
42 | |||
43 | spinlock_t resync_lock; | ||
44 | int nr_pending; | ||
45 | int nr_waiting; | ||
46 | int nr_queued; | ||
47 | int barrier; | ||
48 | sector_t next_resync; | ||
49 | int fullsync; /* set to 1 if a full sync is needed, | ||
50 | * (fresh device added). | ||
51 | * Cleared when a sync completes. | ||
52 | */ | ||
53 | |||
54 | wait_queue_head_t wait_barrier; | ||
55 | |||
56 | struct pool_info *poolinfo; | ||
57 | |||
58 | struct page *tmppage; | ||
59 | |||
60 | mempool_t *r1bio_pool; | ||
61 | mempool_t *r1buf_pool; | ||
62 | }; | ||
63 | |||
64 | typedef struct r1_private_data_s conf_t; | ||
65 | |||
/*
 * This is the only point in the RAID code where we violate C type
 * safety: mddev->private is an 'opaque' pointer, and this macro casts
 * it back to conf_t.
 *
 * The argument is parenthesized so that any pointer-valued expression
 * (for example "base + 1" or "a ? b : c") can be passed; without the
 * parentheses '->' would bind to only the last operand of the argument.
 */
#define mddev_to_conf(mddev) ((conf_t *) (mddev)->private)
71 | |||
72 | /* | ||
73 | * this is our 'private' RAID1 bio. | ||
74 | * | ||
75 | * it contains information about what kind of IO operations were started | ||
76 | * for this RAID1 operation, and about their status: | ||
77 | */ | ||
78 | |||
79 | struct r1bio_s { | ||
80 | atomic_t remaining; /* 'have we finished' count, | ||
81 | * used from IRQ handlers | ||
82 | */ | ||
83 | atomic_t behind_remaining; /* number of write-behind ios remaining | ||
84 | * in this BehindIO request | ||
85 | */ | ||
86 | sector_t sector; | ||
87 | int sectors; | ||
88 | unsigned long state; | ||
89 | mddev_t *mddev; | ||
90 | /* | ||
91 | * original bio going to /dev/mdx | ||
92 | */ | ||
93 | struct bio *master_bio; | ||
94 | /* | ||
95 | * if the IO is in READ direction, then this is where we read | ||
96 | */ | ||
97 | int read_disk; | ||
98 | |||
99 | struct list_head retry_list; | ||
100 | struct bitmap_update *bitmap_update; | ||
101 | /* | ||
102 | * if the IO is in WRITE direction, then multiple bios are used. | ||
103 | * We choose the number when they are allocated. | ||
104 | */ | ||
105 | struct bio *bios[0]; | ||
106 | /* DO NOT PUT ANY NEW FIELDS HERE - bios array is contiguously alloced*/ | ||
107 | }; | ||
108 | |||
/*
 * A read error on a read-only array is handled by redirecting the read
 * to another device; the first device is not failed, and no over-write
 * is attempted to correct the read error.  Bad blocks are tracked per
 * bio by storing IO_BLOCKED in the corresponding 'bios' pointer.
 */
#define IO_BLOCKED ((struct bio *)1)
115 | |||
/*
 * Bits for r1bio.state.
 *
 * Kept as an enum rather than a run of #defines so that the names are
 * visible to a debugger and are not subject to macro expansion.  The
 * values are spelled out explicitly because they are bit numbers and
 * must not change.
 */
enum {
	R1BIO_Uptodate		= 0,
	R1BIO_IsSync		= 1,
	R1BIO_Degraded		= 2,
	R1BIO_BehindIO		= 3,
	R1BIO_Barrier		= 4,
	R1BIO_BarrierRetry	= 5,
	/*
	 * For write-behind requests, we call bi_end_io when
	 * the last non-write-behind device completes, providing
	 * any write was successful.  Otherwise we call when
	 * any write-behind write succeeds, otherwise we call
	 * with failure when last write completes (and all failed).
	 * Record that bi_end_io was called with this flag...
	 */
	R1BIO_Returned		= 6
};
131 | |||
132 | #endif | ||