]>
Commit | Line | Data |
---|---|---|
0b86a832 CM |
1 | /* |
2 | * Copyright (C) 2007 Oracle. All rights reserved. | |
3 | * | |
4 | * This program is free software; you can redistribute it and/or | |
5 | * modify it under the terms of the GNU General Public | |
6 | * License v2 as published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope that it will be useful, | |
9 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
11 | * General Public License for more details. | |
12 | * | |
13 | * You should have received a copy of the GNU General Public | |
14 | * License along with this program; if not, write to the | |
15 | * Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
16 | * Boston, MA 02111-1307, USA. | |
17 | */ | |
18 | ||
19 | #ifndef __BTRFS_VOLUMES_ | |
20 | #define __BTRFS_VOLUMES_ | |
8790d502 | 21 | |
cea9e445 | 22 | #include <linux/bio.h> |
b2117a39 | 23 | #include <linux/sort.h> |
55e301fd | 24 | #include <linux/btrfs.h> |
8b712842 | 25 | #include "async-thread.h" |
cea9e445 | 26 | |
b2117a39 MX |
27 | #define BTRFS_STRIPE_LEN (64 * 1024) |
28 | ||
f2984462 | 29 | struct buffer_head; |
ffbd517d CM |
/*
 * Head and tail bio pointers for one batch of pending bios.
 * struct btrfs_device embeds two of these: one for regular-priority
 * bios and one for WRITE_SYNC bios.
 * NOTE(review): how the bios between head and tail are linked is not
 * visible in this header -- confirm against the users.
 */
30 | struct btrfs_pending_bios { |
31 | struct bio *head; | |
32 | struct bio *tail; | |
33 | }; | |
34 | ||
0b86a832 CM |
/*
 * Per-device state: list linkage, pending bio batches, size and usage
 * accounting, flush-barrier bookkeeping, scrub and readahead state, and
 * the I/O failure counters accessed through the btrfs_dev_stat_*()
 * inline helpers at the end of this header.
 */
35 | struct btrfs_device { |
36 | struct list_head dev_list; | |
b3075717 | 37 | struct list_head dev_alloc_list; |
2b82032c | 38 | struct btrfs_fs_devices *fs_devices; |
0b86a832 | 39 | struct btrfs_root *dev_root; |
ffbd517d CM |
40 | |
41 | /* regular prio bios */ | |
42 | struct btrfs_pending_bios pending_bios; | |
43 | /* WRITE_SYNC bios */ | |
44 | struct btrfs_pending_bios pending_sync_bios; | |
45 | ||
dfe25020 | 46 | u64 generation; |
3c45bfc1 | 47 | int running_pending; |
2b82032c | 48 | int writeable; |
dfe25020 | 49 | int in_fs_metadata; |
cd02dca5 | 50 | int missing; |
d5e2003c | 51 | int can_discard; |
63a212ab | 52 | int is_tgtdev_for_dev_replace; |
b3075717 | 53 | |
8790d502 | 54 | spinlock_t io_lock; |
3c45bfc1 DG |
55 | /* the mode sent to blkdev_get */ |
56 | fmode_t mode; | |
0b86a832 CM |
57 | |
58 | struct block_device *bdev; | |
59 | ||
15916de8 | 60 | |
606686ee | 61 | struct rcu_string *name; |
8a4b83cc | 62 | |
0b86a832 CM |
63 | /* the internal btrfs device id */ |
64 | u64 devid; | |
65 | ||
66 | /* size of the device */ | |
67 | u64 total_bytes; | |
68 | ||
d6397bae CB |
69 | /* size of the disk */ |
70 | u64 disk_total_bytes; | |
71 | ||
0b86a832 CM |
72 | /* bytes used */ |
73 | u64 bytes_used; | |
74 | ||
75 | /* optimal io alignment for this device */ | |
76 | u32 io_align; | |
77 | ||
78 | /* optimal io width for this device */ | |
79 | u32 io_width; | |
3c45bfc1 DG |
80 | /* type and info about this device */ |
81 | u64 type; | |
0b86a832 CM |
82 | |
83 | /* minimal io size for this device */ | |
84 | u32 sector_size; | |
85 | ||
0b86a832 | 86 | |
0b86a832 | 87 | /* physical drive uuid (or lvm uuid) */ |
e17cade2 | 88 | u8 uuid[BTRFS_UUID_SIZE]; |
8b712842 | 89 | |
3c45bfc1 DG |
90 | /* for sending down flush barriers */ |
91 | int nobarriers; | |
92 | struct bio *flush_bio; | |
93 | struct completion flush_wait; | |
94 | ||
a2de733c | 95 | /* per-device scrub information */ |
d9d181c1 | 96 | struct scrub_ctx *scrub_device; |
a2de733c | 97 | |
d458b054 | 98 | struct btrfs_work work; |
1f78160c XG |
99 | struct rcu_head rcu; |
100 | struct work_struct rcu_work; | |
90519d66 AJ |
101 | |
102 | /* readahead state */ | |
103 | spinlock_t reada_lock; | |
104 | atomic_t reada_in_flight; | |
105 | u64 reada_next; | |
106 | struct reada_zone *reada_curr_zone; | |
107 | struct radix_tree_root reada_zones; | |
108 | struct radix_tree_root reada_extents; | |
387125fc | 109 | |
387125fc | 110 | |
442a4f63 SB |
111 | /* disk I/O failure stats. For detailed description refer to |
112 | * enum btrfs_dev_stat_values in ioctl.h */ | |
733f4fbb | 113 | int dev_stats_valid; |
442a4f63 SB |
114 | int dev_stats_dirty; /* counters need to be written to disk */ |
/* one atomic counter per statistic, addressed as dev_stat_values + index
 * by the btrfs_dev_stat_*() helpers */
115 | atomic_t dev_stat_values[BTRFS_DEV_STAT_VALUES_MAX]; | |
0b86a832 CM |
116 | }; |
117 | ||
8a4b83cc CM |
/*
 * The set of devices that belong to one filesystem, identified by fsid,
 * together with aggregate counters over that set.
 * `devices` is the list that device_list_mutex protects (see the comment
 * on the mutex); `alloc_list` holds the devices described by its own
 * comment below.
 */
118 | struct btrfs_fs_devices { |
119 | u8 fsid[BTRFS_FSID_SIZE]; /* FS specific uuid */ | |
120 | ||
d4a78947 | 121 | /* the device with this id has the most recent copy of the super */ |
8a4b83cc CM |
122 | u64 latest_devid; |
123 | u64 latest_trans; | |
8a4b83cc | 124 | u64 num_devices; |
a0af469b | 125 | u64 open_devices; |
2b82032c | 126 | u64 rw_devices; |
cd02dca5 | 127 | u64 missing_devices; |
2b82032c | 128 | u64 total_rw_bytes; |
d5e2003c | 129 | u64 num_can_discard; |
02db0844 | 130 | u64 total_devices; |
8a4b83cc | 131 | struct block_device *latest_bdev; |
e5e9a520 CM |
132 | |
133 | /* all of the devices in the FS, protected by a mutex | |
134 | * so we can safely walk it to write out the supers without | |
9b011adf WS |
135 | * worrying about add/remove by the multi-device code. |
136 | * Scrubbing super can kick off supers writing by holding | |
137 | * this mutex lock. | |
e5e9a520 CM |
138 | */ |
139 | struct mutex device_list_mutex; | |
8a4b83cc | 140 | struct list_head devices; |
b3075717 CM |
141 | |
142 | /* devices not currently being allocated */ | |
143 | struct list_head alloc_list; | |
8a4b83cc | 144 | struct list_head list; |
2b82032c YZ |
145 | |
146 | struct btrfs_fs_devices *seed; | |
147 | int seeding; | |
2b82032c YZ |
148 | |
149 | int opened; | |
c289811c CM |
150 | |
151 | /* set when we find or add a device that doesn't have the | |
152 | * nonrot flag set | |
153 | */ | |
154 | int rotating; | |
8a4b83cc CM |
155 | }; |
156 | ||
facc8a22 MX |
/* Number of u8 elements in the csum_inline[] buffer embedded in struct btrfs_io_bio. */
157 | #define BTRFS_BIO_INLINE_CSUM_SIZE 64 |
158 | ||
9be3395b CM |
159 | /* |
160 | * we need the mirror number and stripe index to be passed around | |
161 | * the call chain while we are processing end_io (especially errors). | |
162 | * Really, what we need is a btrfs_bio structure that has this info | |
163 | * and is properly sized with its stripe array, but we're not there | |
164 | * quite yet. We have our own btrfs bioset, and all of the bios | |
165 | * we allocate are actually btrfs_io_bios. We'll cram as much of | |
166 | * struct btrfs_bio as we can into this over time. | |
167 | */ | |
/*
 * Completion callback type stored in btrfs_io_bio.end_io.
 * NOTE(review): this typedef names struct btrfs_io_bio before the
 * definition below. Unless an earlier declaration of the tag is already
 * visible (none is shown in this header), the parameter type has
 * prototype scope only -- confirm that an including header declares it.
 */
facc8a22 | 168 | typedef void (btrfs_io_bio_end_io_t) (struct btrfs_io_bio *bio, int err);
9be3395b CM |
/*
 * Wrapper that carries btrfs-specific fields alongside an embedded
 * struct bio. Because `bio` is embedded by value, btrfs_io_bio() can
 * recover the wrapper from a bio pointer with container_of().
 * Checksum fields: `csum` and `csum_allocated` are pointers, `csum_inline`
 * is a fixed buffer of BTRFS_BIO_INLINE_CSUM_SIZE bytes.
 * NOTE(review): which buffer `csum` points at, and who frees
 * `csum_allocated`, is not visible here -- confirm against the users.
 */
169 | struct btrfs_io_bio { |
170 | unsigned long mirror_num; | |
171 | unsigned long stripe_index; | |
facc8a22 MX |
172 | u8 *csum; |
173 | u8 csum_inline[BTRFS_BIO_INLINE_CSUM_SIZE]; | |
174 | u8 *csum_allocated; | |
175 | btrfs_io_bio_end_io_t *end_io; | |
9be3395b CM |
176 | struct bio bio; |
177 | }; | |
178 | ||
/*
 * Return the struct btrfs_io_bio that contains @bio as its `bio` member.
 * The result is computed with container_of(), so it is only meaningful
 * when @bio really is embedded in a struct btrfs_io_bio.
 */
179 | static inline struct btrfs_io_bio *btrfs_io_bio(struct bio *bio) | |
180 | { | |
181 | return container_of(bio, struct btrfs_io_bio, bio); | |
182 | } | |
183 | ||
cea9e445 CM |
/*
 * One stripe entry: a device plus a `physical` value on it.
 * Used as the element type of the trailing stripes[] arrays in
 * struct btrfs_bio and struct map_lookup.
 * NOTE(review): `physical` is presumably a byte offset on `dev` -- confirm.
 */
184 | struct btrfs_bio_stripe { |
185 | struct btrfs_device *dev; | |
186 | u64 physical; | |
fce3bb9a | 187 | u64 length; /* only used for discard mappings */ |
cea9e445 CM |
188 | }; |
189 | ||
a1d3c478 JS |
/* Forward declaration so the callback typedef below can name the struct. */
190 | struct btrfs_bio; |
191 | typedef void (btrfs_bio_end_io_t) (struct btrfs_bio *bio, int err); | |
192 | ||
c55f1396 MX |
/* NOTE(review): presumably a bit for btrfs_bio.flags -- confirm against the users. */
193 | #define BTRFS_BIO_ORIG_BIO_SUBMITTED 0x1 |
194 | ||
/*
 * Bookkeeping for an I/O described by num_stripes entries in the
 * trailing stripes[] flexible array. Size an allocation with
 * btrfs_bio_size(n) to reserve room for n stripes.
 * Note that `end_io` here has type bio_end_io_t, not the
 * btrfs_bio_end_io_t typedef declared above.
 */
a1d3c478 | 195 | struct btrfs_bio {
cea9e445 | 196 | atomic_t stripes_pending;
c404e0dc | 197 | struct btrfs_fs_info *fs_info;
cea9e445 | 198 | bio_end_io_t *end_io;
7d2b4daa | 199 | struct bio *orig_bio;
c55f1396 | 200 | unsigned long flags;
cea9e445 | 201 | void *private;
a236aed1 CM |
202 | atomic_t error;
203 | int max_errors; | |
cea9e445 | 204 | int num_stripes;
a1d3c478 | 205 | int mirror_num;
cea9e445 CM |
206 | struct btrfs_bio_stripe stripes[];
207 | }; | |
208 | ||
b2117a39 MX |
/*
 * Per-device record pairing a device with an offset and two
 * availability figures.
 * NOTE(review): presumably filled in while choosing devices for a new
 * chunk (max_avail = largest free extent, total_avail = total free
 * space) -- confirm against the allocator code.
 */
209 | struct btrfs_device_info { |
210 | struct btrfs_device *dev; | |
211 | u64 dev_offset; | |
212 | u64 max_avail; | |
73c5de00 | 213 | u64 total_avail; |
b2117a39 MX |
214 | }; |
215 | ||
31e50229 LB |
/* Parameters describing one RAID profile: stripe layout, device limits and copy count. */
216 | struct btrfs_raid_attr { |
217 | int sub_stripes; /* sub_stripes info for map */ | |
218 | int dev_stripes; /* stripes per dev */ | |
219 | int devs_max; /* max devs to use */ | |
220 | int devs_min; /* min devs needed */ | |
221 | int devs_increment; /* ndevs has to be a multiple of this */ | |
222 | int ncopies; /* how many copies the data has */ | |
223 | }; | |
224 | ||
/*
 * Stripe layout record ending in a flexible array of num_stripes
 * entries. Size an allocation with map_lookup_size(n) to reserve room
 * for n stripes.
 * NOTE(review): presumably describes the mapping of one chunk -- confirm.
 */
1abe9b8a | 225 | struct map_lookup {
226 | u64 type; | |
227 | int io_align; | |
228 | int io_width; | |
229 | int stripe_len; | |
230 | int sector_size; | |
231 | int num_stripes; | |
232 | int sub_stripes; | |
233 | struct btrfs_bio_stripe stripes[]; | |
234 | }; | |
235 | ||
a2de733c AJ |
/*
 * Bytes needed for a struct map_lookup followed by n stripes[] entries.
 * The argument is parenthesized and evaluated once; the multiplication
 * is not checked for overflow.
 */
236 | #define map_lookup_size(n) (sizeof(struct map_lookup) + \ |
237 | (sizeof(struct btrfs_bio_stripe) * (n))) | |
238 | ||
f43ffb60 ID |
239 | /* |
240 | * Restriper's general type filter | |
241 | */ | |
242 | #define BTRFS_BALANCE_DATA (1ULL << 0) | |
243 | #define BTRFS_BALANCE_SYSTEM (1ULL << 1) | |
244 | #define BTRFS_BALANCE_METADATA (1ULL << 2) | |
245 | ||
/* Union of the three type-filter bits above (bits 0-2). */
246 | #define BTRFS_BALANCE_TYPE_MASK (BTRFS_BALANCE_DATA | \ | |
247 | BTRFS_BALANCE_SYSTEM | \ | |
248 | BTRFS_BALANCE_METADATA) | |
e4d8ec0f ID |
249 | |
/* Further flags in the same bit space as the type filter (bits 3 and 4). */
250 | #define BTRFS_BALANCE_FORCE (1ULL << 3) | |
59641015 | 251 | #define BTRFS_BALANCE_RESUME (1ULL << 4) |
e4d8ec0f | 252 | |
ed25e9b2 ID |
253 | /* |
254 | * Balance filters | |
255 | */ | |
256 | #define BTRFS_BALANCE_ARGS_PROFILES (1ULL << 0) | |
5ce5b3c0 | 257 | #define BTRFS_BALANCE_ARGS_USAGE (1ULL << 1) |
409d404b | 258 | #define BTRFS_BALANCE_ARGS_DEVID (1ULL << 2) |
94e60d5a | 259 | #define BTRFS_BALANCE_ARGS_DRANGE (1ULL << 3) |
ea67176a | 260 | #define BTRFS_BALANCE_ARGS_VRANGE (1ULL << 4) |
7d824b6f | 261 | #define BTRFS_BALANCE_ARGS_LIMIT (1ULL << 5) |
f43ffb60 | 262 | |
cfa4c961 ID |
263 | /* |
264 | * Profile changing flags. When SOFT is set we won't relocate chunk if | |
265 | * it already has the target profile (even though it may be | |
266 | * half-filled). | |
267 | */ | |
/* These use bits 8 and 9; bits 6 and 7 are not assigned in this header. */
e4d8ec0f | 268 | #define BTRFS_BALANCE_ARGS_CONVERT (1ULL << 8) |
cfa4c961 | 269 | #define BTRFS_BALANCE_ARGS_SOFT (1ULL << 9) |
e4d8ec0f | 270 | |
/*
 * State for one balance operation: separate argument sets for data,
 * metadata and system, a flags word, and a progress record.
 * The args and progress structs are embedded by value, so their complete
 * definitions must be visible before this point; the forward
 * declarations alone are not sufficient.
 * NOTE(review): presumably they come from <linux/btrfs.h>, included
 * above -- confirm.
 */
c9e9f97b | 271 | struct btrfs_balance_args; |
19a39dce | 272 | struct btrfs_balance_progress; |
c9e9f97b ID |
273 | struct btrfs_balance_control { |
274 | struct btrfs_fs_info *fs_info; | |
275 | ||
276 | struct btrfs_balance_args data; | |
277 | struct btrfs_balance_args meta; | |
278 | struct btrfs_balance_args sys; | |
279 | ||
280 | u64 flags; | |
19a39dce ID |
281 | |
282 | struct btrfs_balance_progress stat; | |
c9e9f97b ID |
283 | }; |
284 | ||
6d07bcec MX |
285 | int btrfs_account_dev_extents_size(struct btrfs_device *device, u64 start, |
286 | u64 end, u64 *length); | |
287 | ||
/*
 * Bytes needed for a struct btrfs_bio followed by n stripes[] entries.
 * The argument is parenthesized and evaluated once; the multiplication
 * is not checked for overflow.
 */
a1d3c478 | 288 | #define btrfs_bio_size(n) (sizeof(struct btrfs_bio) + \
cea9e445 CM |
289 | (sizeof(struct btrfs_bio_stripe) * (n))) |
290 | ||
3ec706c8 | 291 | int btrfs_map_block(struct btrfs_fs_info *fs_info, int rw, |
cea9e445 | 292 | u64 logical, u64 *length, |
a1d3c478 | 293 | struct btrfs_bio **bbio_ret, int mirror_num); |
a512bbf8 YZ |
294 | int btrfs_rmap_block(struct btrfs_mapping_tree *map_tree, |
295 | u64 chunk_start, u64 physical, u64 devid, | |
296 | u64 **logical, int *naddrs, int *stripe_len); | |
e4404d6e | 297 | int btrfs_read_sys_array(struct btrfs_root *root); |
0b86a832 CM |
298 | int btrfs_read_chunk_tree(struct btrfs_root *root); |
299 | int btrfs_alloc_chunk(struct btrfs_trans_handle *trans, | |
2b82032c | 300 | struct btrfs_root *extent_root, u64 type); |
0b86a832 CM |
301 | void btrfs_mapping_init(struct btrfs_mapping_tree *tree); |
302 | void btrfs_mapping_tree_free(struct btrfs_mapping_tree *tree); | |
f188591e | 303 | int btrfs_map_bio(struct btrfs_root *root, int rw, struct bio *bio, |
8b712842 | 304 | int mirror_num, int async_submit); |
8a4b83cc | 305 | int btrfs_open_devices(struct btrfs_fs_devices *fs_devices, |
97288f2c CH |
306 | fmode_t flags, void *holder); |
307 | int btrfs_scan_one_device(const char *path, fmode_t flags, void *holder, | |
8a4b83cc CM |
308 | struct btrfs_fs_devices **fs_devices_ret); |
309 | int btrfs_close_devices(struct btrfs_fs_devices *fs_devices); | |
8dabb742 SB |
310 | void btrfs_close_extra_devices(struct btrfs_fs_info *fs_info, |
311 | struct btrfs_fs_devices *fs_devices, int step); | |
7ba15b7d SB |
312 | int btrfs_find_device_missing_or_by_path(struct btrfs_root *root, |
313 | char *device_path, | |
314 | struct btrfs_device **device); | |
12bd2fc0 ID |
315 | struct btrfs_device *btrfs_alloc_device(struct btrfs_fs_info *fs_info, |
316 | const u64 *devid, | |
317 | const u8 *uuid); | |
a061fc8d | 318 | int btrfs_rm_device(struct btrfs_root *root, char *device_path); |
143bede5 | 319 | void btrfs_cleanup_fs_uuids(void); |
5d964051 | 320 | int btrfs_num_copies(struct btrfs_fs_info *fs_info, u64 logical, u64 len); |
8f18cf13 CM |
321 | int btrfs_grow_device(struct btrfs_trans_handle *trans, |
322 | struct btrfs_device *device, u64 new_size); | |
aa1b8cd4 | 323 | struct btrfs_device *btrfs_find_device(struct btrfs_fs_info *fs_info, u64 devid, |
2b82032c | 324 | u8 *uuid, u8 *fsid); |
8f18cf13 | 325 | int btrfs_shrink_device(struct btrfs_device *device, u64 new_size); |
788f20eb | 326 | int btrfs_init_new_device(struct btrfs_root *root, char *path); |
e93c89c1 SB |
327 | int btrfs_init_dev_replace_tgtdev(struct btrfs_root *root, char *device_path, |
328 | struct btrfs_device **device_out); | |
c9e9f97b ID |
329 | int btrfs_balance(struct btrfs_balance_control *bctl, |
330 | struct btrfs_ioctl_balance_args *bargs); | |
2b6ba629 | 331 | int btrfs_resume_balance_async(struct btrfs_fs_info *fs_info); |
68310a5e | 332 | int btrfs_recover_balance(struct btrfs_fs_info *fs_info); |
837d5b6e | 333 | int btrfs_pause_balance(struct btrfs_fs_info *fs_info); |
a7e99c69 | 334 | int btrfs_cancel_balance(struct btrfs_fs_info *fs_info); |
f7a81ea4 | 335 | int btrfs_create_uuid_tree(struct btrfs_fs_info *fs_info); |
70f80175 | 336 | int btrfs_check_uuid_tree(struct btrfs_fs_info *fs_info); |
2b82032c | 337 | int btrfs_chunk_readonly(struct btrfs_root *root, u64 chunk_offset); |
6df9a95e JB |
338 | int find_free_dev_extent(struct btrfs_trans_handle *trans, |
339 | struct btrfs_device *device, u64 num_bytes, | |
ba1bf481 | 340 | u64 *start, u64 *max_avail); |
442a4f63 | 341 | void btrfs_dev_stat_inc_and_print(struct btrfs_device *dev, int index); |
c11d2c23 | 342 | int btrfs_get_dev_stats(struct btrfs_root *root, |
b27f7c0c | 343 | struct btrfs_ioctl_get_dev_stats *stats); |
cb517eab | 344 | void btrfs_init_devices_late(struct btrfs_fs_info *fs_info); |
733f4fbb SB |
345 | int btrfs_init_dev_stats(struct btrfs_fs_info *fs_info); |
346 | int btrfs_run_dev_stats(struct btrfs_trans_handle *trans, | |
347 | struct btrfs_fs_info *fs_info); | |
e93c89c1 SB |
348 | void btrfs_rm_dev_replace_srcdev(struct btrfs_fs_info *fs_info, |
349 | struct btrfs_device *srcdev); | |
350 | void btrfs_destroy_dev_replace_tgtdev(struct btrfs_fs_info *fs_info, | |
351 | struct btrfs_device *tgtdev); | |
352 | void btrfs_init_dev_replace_tgtdev_for_resume(struct btrfs_fs_info *fs_info, | |
353 | struct btrfs_device *tgtdev); | |
a8a6dab7 | 354 | int btrfs_scratch_superblock(struct btrfs_device *device); |
53b381b3 DW |
355 | int btrfs_is_parity_mirror(struct btrfs_mapping_tree *map_tree, |
356 | u64 logical, u64 len, int mirror_num); | |
357 | unsigned long btrfs_full_stripe_len(struct btrfs_root *root, | |
358 | struct btrfs_mapping_tree *map_tree, | |
359 | u64 logical); | |
6df9a95e JB |
360 | int btrfs_finish_chunk_alloc(struct btrfs_trans_handle *trans, |
361 | struct btrfs_root *extent_root, | |
362 | u64 chunk_offset, u64 chunk_size); | |
442a4f63 SB |
/*
 * Atomically increment the statistics counter at @index for @dev and
 * mark the device's stats as dirty.
 * @index is used unchecked as an offset into dev->dev_stat_values; the
 * dirty flag is a plain int store, not an atomic operation.
 */
363 | static inline void btrfs_dev_stat_inc(struct btrfs_device *dev, |
364 | int index) | |
365 | { | |
366 | atomic_inc(dev->dev_stat_values + index); | |
367 | dev->dev_stats_dirty = 1; | |
368 | } | |
369 | ||
/*
 * Return the current value of the statistics counter at @index for @dev.
 * Does not modify the counter or the dirty flag; @index is not
 * range-checked.
 */
370 | static inline int btrfs_dev_stat_read(struct btrfs_device *dev, | |
371 | int index) | |
372 | { | |
373 | return atomic_read(dev->dev_stat_values + index); | |
374 | } | |
375 | ||
/*
 * Atomically replace the counter at @index with 0 and return the value
 * it held before. The stats are marked dirty unconditionally, even when
 * the previous value was already 0.
 */
376 | static inline int btrfs_dev_stat_read_and_reset(struct btrfs_device *dev, | |
377 | int index) | |
378 | { | |
379 | int ret; | |
380 | ||
381 | ret = atomic_xchg(dev->dev_stat_values + index, 0); | |
382 | dev->dev_stats_dirty = 1; | |
383 | return ret; | |
384 | } | |
385 | ||
/*
 * Store @val into the statistics counter at @index for @dev and mark
 * the stats as dirty.
 * NOTE(review): @val is unsigned long but is handed to atomic_set() on
 * an atomic_t, which presumably holds an int; larger values would be
 * truncated -- confirm callers stay within int range.
 */
386 | static inline void btrfs_dev_stat_set(struct btrfs_device *dev, | |
387 | int index, unsigned long val) | |
388 | { | |
389 | atomic_set(dev->dev_stat_values + index, val); | |
390 | dev->dev_stats_dirty = 1; | |
391 | } | |
392 | ||
/*
 * Set the statistics counter at @index for @dev to 0 by delegating to
 * btrfs_dev_stat_set(), which also marks the stats as dirty.
 */
393 | static inline void btrfs_dev_stat_reset(struct btrfs_device *dev, | |
394 | int index) | |
395 | { | |
396 | btrfs_dev_stat_set(dev, index, 0); | |
397 | } | |
0b86a832 | 398 | #endif |