Loading...
1/* SPDX-License-Identifier: GPL-2.0 */
2#ifndef _RAID10_H
3#define _RAID10_H
4
5/* Note: raid10_info.rdev can be set to NULL asynchronously by
6 * raid10_remove_disk.
7 * There are three safe ways to access raid10_info.rdev.
8 * 1/ when holding mddev->reconfig_mutex
9 * 2/ when resync/recovery/reshape is known to be happening - i.e. in code
10 * that is called as part of performing resync/recovery/reshape.
11 * 3/ while holding rcu_read_lock(), use rcu_dereference to get the pointer
12 * and if it is non-NULL, increment rdev->nr_pending before dropping the
13 * RCU lock.
14 * When .rdev is set to NULL, the nr_pending count checked again and if it has
15 * been incremented, the pointer is put back in .rdev.
16 */
17
18struct raid10_info {
19 struct md_rdev *rdev, *replacement;
20 sector_t head_position;
21 int recovery_disabled; /* matches
22 * mddev->recovery_disabled
23 * when we shouldn't try
24 * recovering this device.
25 */
26};
27
28struct r10conf {
29 struct mddev *mddev;
30 struct raid10_info *mirrors;
31 struct raid10_info *mirrors_new, *mirrors_old;
32 spinlock_t device_lock;
33
34 /* geometry */
35 struct geom {
36 int raid_disks;
37 int near_copies; /* number of copies laid out
38 * raid0 style */
39 int far_copies; /* number of copies laid out
40 * at large strides across drives
41 */
42 int far_offset; /* far_copies are offset by 1
43 * stripe instead of many
44 */
45 sector_t stride; /* distance between far copies.
46 * This is size / far_copies unless
47 * far_offset, in which case it is
48 * 1 stripe.
49 */
50 int far_set_size; /* The number of devices in a set,
51 * where a 'set' are devices that
52 * contain far/offset copies of
53 * each other.
54 */
55 int chunk_shift; /* shift from chunks to sectors */
56 sector_t chunk_mask;
57 } prev, geo;
58 int copies; /* near_copies * far_copies.
59 * must be <= raid_disks
60 */
61
62 sector_t dev_sectors; /* temp copy of
63 * mddev->dev_sectors */
64 sector_t reshape_progress;
65 sector_t reshape_safe;
66 unsigned long reshape_checkpoint;
67 sector_t offset_diff;
68
69 struct list_head retry_list;
70 /* A separate list of r1bio which just need raid_end_bio_io called.
71 * This mustn't happen for writes which had any errors if the superblock
72 * needs to be written.
73 */
74 struct list_head bio_end_io_list;
75
76 /* queue pending writes and submit them on unplug */
77 struct bio_list pending_bio_list;
78
79 seqlock_t resync_lock;
80 atomic_t nr_pending;
81 int nr_waiting;
82 int nr_queued;
83 int barrier;
84 int array_freeze_pending;
85 sector_t next_resync;
86 int fullsync; /* set to 1 if a full sync is needed,
87 * (fresh device added).
88 * Cleared when a sync completes.
89 */
90 int have_replacement; /* There is at least one
91 * replacement device.
92 */
93 wait_queue_head_t wait_barrier;
94
95 mempool_t r10bio_pool;
96 mempool_t r10buf_pool;
97 struct page *tmppage;
98 struct bio_set bio_split;
99
100 /* When taking over an array from a different personality, we store
101 * the new thread here until we fully activate the array.
102 */
103 struct md_thread __rcu *thread;
104
105 /*
106 * Keep track of cluster resync window to send to other nodes.
107 */
108 sector_t cluster_sync_low;
109 sector_t cluster_sync_high;
110};
111
112/*
113 * this is our 'private' RAID10 bio.
114 *
115 * it contains information about what kind of IO operations were started
116 * for this RAID10 operation, and about their status:
117 */
118
119struct r10bio {
120 atomic_t remaining; /* 'have we finished' count,
121 * used from IRQ handlers
122 */
123 sector_t sector; /* virtual sector number */
124 int sectors;
125 unsigned long state;
126 struct mddev *mddev;
127 /*
128 * original bio going to /dev/mdx
129 */
130 struct bio *master_bio;
131 /*
132 * if the IO is in READ direction, then this is where we read
133 */
134 int read_slot;
135
136 struct list_head retry_list;
137 /*
138 * if the IO is in WRITE direction, then multiple bios are used,
139 * one for each copy.
140 * When resyncing we also use one for each copy.
141 * When reconstructing, we use 2 bios, one for read, one for write.
142 * We choose the number when they are allocated.
143 * We sometimes need an extra bio to write to the replacement.
144 */
145 struct r10dev {
146 struct bio *bio;
147 union {
148 struct bio *repl_bio; /* used for resync and
149 * writes */
150 struct md_rdev *rdev; /* used for reads
151 * (read_slot >= 0) */
152 };
153 sector_t addr;
154 int devnum;
155 } devs[];
156};
157
158/* bits for r10bio.state */
159enum r10bio_state {
160 R10BIO_Uptodate,
161 R10BIO_IsSync,
162 R10BIO_IsRecover,
163 R10BIO_IsReshape,
164 R10BIO_Degraded,
165/* Set ReadError on bios that experience a read error
166 * so that raid10d knows what to do with them.
167 */
168 R10BIO_ReadError,
169/* If a write for this request means we can clear some
170 * known-bad-block records, we set this flag.
171 */
172 R10BIO_MadeGood,
173 R10BIO_WriteError,
174/* During a reshape we might be performing IO on the
175 * 'previous' part of the array, in which case this
176 * flag is set
177 */
178 R10BIO_Previous,
179/* failfast devices did receive failfast requests. */
180 R10BIO_FailFast,
181 R10BIO_Discard,
182};
183#endif
1#ifndef _RAID10_H
2#define _RAID10_H
3
4struct raid10_info {
5 struct md_rdev *rdev, *replacement;
6 sector_t head_position;
7 int recovery_disabled; /* matches
8 * mddev->recovery_disabled
9 * when we shouldn't try
10 * recovering this device.
11 */
12};
13
14struct r10conf {
15 struct mddev *mddev;
16 struct raid10_info *mirrors;
17 struct raid10_info *mirrors_new, *mirrors_old;
18 spinlock_t device_lock;
19
20 /* geometry */
21 struct geom {
22 int raid_disks;
23 int near_copies; /* number of copies laid out
24 * raid0 style */
25 int far_copies; /* number of copies laid out
26 * at large strides across drives
27 */
28 int far_offset; /* far_copies are offset by 1
29 * stripe instead of many
30 */
31 sector_t stride; /* distance between far copies.
32 * This is size / far_copies unless
33 * far_offset, in which case it is
34 * 1 stripe.
35 */
36 int far_set_size; /* The number of devices in a set,
37 * where a 'set' are devices that
38 * contain far/offset copies of
39 * each other.
40 */
41 int chunk_shift; /* shift from chunks to sectors */
42 sector_t chunk_mask;
43 } prev, geo;
44 int copies; /* near_copies * far_copies.
45 * must be <= raid_disks
46 */
47
48 sector_t dev_sectors; /* temp copy of
49 * mddev->dev_sectors */
50 sector_t reshape_progress;
51 sector_t reshape_safe;
52 unsigned long reshape_checkpoint;
53 sector_t offset_diff;
54
55 struct list_head retry_list;
56 /* queue pending writes and submit them on unplug */
57 struct bio_list pending_bio_list;
58 int pending_count;
59
60 spinlock_t resync_lock;
61 int nr_pending;
62 int nr_waiting;
63 int nr_queued;
64 int barrier;
65 sector_t next_resync;
66 int fullsync; /* set to 1 if a full sync is needed,
67 * (fresh device added).
68 * Cleared when a sync completes.
69 */
70 int have_replacement; /* There is at least one
71 * replacement device.
72 */
73 wait_queue_head_t wait_barrier;
74
75 mempool_t *r10bio_pool;
76 mempool_t *r10buf_pool;
77 struct page *tmppage;
78
79 /* When taking over an array from a different personality, we store
80 * the new thread here until we fully activate the array.
81 */
82 struct md_thread *thread;
83};
84
85/*
86 * this is our 'private' RAID10 bio.
87 *
88 * it contains information about what kind of IO operations were started
89 * for this RAID10 operation, and about their status:
90 */
91
92struct r10bio {
93 atomic_t remaining; /* 'have we finished' count,
94 * used from IRQ handlers
95 */
96 sector_t sector; /* virtual sector number */
97 int sectors;
98 unsigned long state;
99 struct mddev *mddev;
100 /*
101 * original bio going to /dev/mdx
102 */
103 struct bio *master_bio;
104 /*
105 * if the IO is in READ direction, then this is where we read
106 */
107 int read_slot;
108
109 struct list_head retry_list;
110 /*
111 * if the IO is in WRITE direction, then multiple bios are used,
112 * one for each copy.
113 * When resyncing we also use one for each copy.
114 * When reconstructing, we use 2 bios, one for read, one for write.
115 * We choose the number when they are allocated.
116 * We sometimes need an extra bio to write to the replacement.
117 */
118 struct r10dev {
119 struct bio *bio;
120 union {
121 struct bio *repl_bio; /* used for resync and
122 * writes */
123 struct md_rdev *rdev; /* used for reads
124 * (read_slot >= 0) */
125 };
126 sector_t addr;
127 int devnum;
128 } devs[0];
129};
130
131/* bits for r10bio.state */
132enum r10bio_state {
133 R10BIO_Uptodate,
134 R10BIO_IsSync,
135 R10BIO_IsRecover,
136 R10BIO_IsReshape,
137 R10BIO_Degraded,
138/* Set ReadError on bios that experience a read error
139 * so that raid10d knows what to do with them.
140 */
141 R10BIO_ReadError,
142/* If a write for this request means we can clear some
143 * known-bad-block records, we set this flag.
144 */
145 R10BIO_MadeGood,
146 R10BIO_WriteError,
147/* During a reshape we might be performing IO on the
148 * 'previous' part of the array, in which case this
149 * flag is set
150 */
151 R10BIO_Previous,
152};
153
154extern int md_raid10_congested(struct mddev *mddev, int bits);
155
156#endif