blob: 53a0633c6ef731d2e16cec67a5338acb18937eb7 [file] [log] [blame]
Greg Kroah-Hartmanb2441312017-11-01 15:07:57 +01001// SPDX-License-Identifier: GPL-2.0
Chris Masond1310b22008-01-24 16:13:08 -05002#include <linux/err.h>
Chris Masond1310b22008-01-24 16:13:08 -05003#include <linux/slab.h>
Chris Masona52d9a82007-08-27 16:49:44 -04004#include <linux/spinlock.h>
Li Zefan261507a02010-12-17 14:21:50 +08005#include "ctree.h"
Chris Masona52d9a82007-08-27 16:49:44 -04006#include "extent_map.h"
Anand Jainebb87652016-03-10 17:26:59 +08007#include "compression.h"
Chris Masona52d9a82007-08-27 16:49:44 -04008
Chris Mason86479a02007-09-10 19:58:16 -04009
Chris Masona52d9a82007-08-27 16:49:44 -040010static struct kmem_cache *extent_map_cache;
Chris Masonca664622007-11-27 11:16:35 -050011
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050012int __init extent_map_init(void)
Chris Masona52d9a82007-08-27 16:49:44 -040013{
David Sterba837e1972012-09-07 03:00:48 -060014 extent_map_cache = kmem_cache_create("btrfs_extent_map",
Christoph Hellwig9601e3f2009-04-13 15:33:09 +020015 sizeof(struct extent_map), 0,
Nikolay Borisovfba4b692016-06-23 21:17:08 +030016 SLAB_MEM_SPREAD, NULL);
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050017 if (!extent_map_cache)
18 return -ENOMEM;
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050019 return 0;
Chris Masona52d9a82007-08-27 16:49:44 -040020}
21
David Sterbae67c7182018-02-19 17:24:18 +010022void __cold extent_map_exit(void)
Chris Masona52d9a82007-08-27 16:49:44 -040023{
Kinglong Mee5598e902016-01-29 21:36:35 +080024 kmem_cache_destroy(extent_map_cache);
Chris Masona52d9a82007-08-27 16:49:44 -040025}
26
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040027/**
28 * extent_map_tree_init - initialize extent map tree
29 * @tree: tree to initialize
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040030 *
31 * Initialize the extent tree @tree. Should be called for each new inode
32 * or other user of the extent_map interface.
33 */
David Sterbaa8067e02011-04-21 00:34:43 +020034void extent_map_tree_init(struct extent_map_tree *tree)
Chris Masona52d9a82007-08-27 16:49:44 -040035{
Eric Paris6bef4d32010-02-23 19:43:04 +000036 tree->map = RB_ROOT;
Josef Bacik5dc562c2012-08-17 13:14:17 -040037 INIT_LIST_HEAD(&tree->modified_extents);
Chris Mason890871b2009-09-02 16:24:52 -040038 rwlock_init(&tree->lock);
Chris Masona52d9a82007-08-27 16:49:44 -040039}
Chris Masona52d9a82007-08-27 16:49:44 -040040
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040041/**
42 * alloc_extent_map - allocate new extent map structure
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040043 *
44 * Allocate a new extent_map structure. The new structure is
45 * returned with a reference count of one and needs to be
46 * freed using free_extent_map()
47 */
David Sterba172ddd62011-04-21 00:48:27 +020048struct extent_map *alloc_extent_map(void)
Chris Masona52d9a82007-08-27 16:49:44 -040049{
50 struct extent_map *em;
Josef Bacik70c8a912012-10-11 16:54:30 -040051 em = kmem_cache_zalloc(extent_map_cache, GFP_NOFS);
Tsutomu Itohc26a9202011-02-14 00:45:29 +000052 if (!em)
53 return NULL;
Filipe Mananacbc0e922014-02-25 14:15:12 +000054 RB_CLEAR_NODE(&em->rb_node);
Chris Masond1310b22008-01-24 16:13:08 -050055 em->flags = 0;
Li Zefan261507a02010-12-17 14:21:50 +080056 em->compress_type = BTRFS_COMPRESS_NONE;
Josef Bacik5dc562c2012-08-17 13:14:17 -040057 em->generation = 0;
Elena Reshetova490b54d2017-03-03 10:55:12 +020058 refcount_set(&em->refs, 1);
Josef Bacik5dc562c2012-08-17 13:14:17 -040059 INIT_LIST_HEAD(&em->list);
Chris Masona52d9a82007-08-27 16:49:44 -040060 return em;
61}
Chris Masona52d9a82007-08-27 16:49:44 -040062
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040063/**
64 * free_extent_map - drop reference count of an extent_map
Nicholas D Steeves01327612016-05-19 21:18:45 -040065 * @em: extent map being released
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040066 *
67 * Drops the reference out on @em by one and free the structure
68 * if the reference count hits zero.
69 */
Chris Masona52d9a82007-08-27 16:49:44 -040070void free_extent_map(struct extent_map *em)
71{
Chris Mason2bf5a722007-08-30 11:54:02 -040072 if (!em)
73 return;
Elena Reshetova490b54d2017-03-03 10:55:12 +020074 WARN_ON(refcount_read(&em->refs) == 0);
75 if (refcount_dec_and_test(&em->refs)) {
Filipe Mananacbc0e922014-02-25 14:15:12 +000076 WARN_ON(extent_map_in_tree(em));
Josef Bacik5dc562c2012-08-17 13:14:17 -040077 WARN_ON(!list_empty(&em->list));
Wang Shilong298a8f92014-06-19 10:42:52 +080078 if (test_bit(EXTENT_FLAG_FS_MAPPING, &em->flags))
Jeff Mahoney95617d62015-06-03 10:55:48 -040079 kfree(em->map_lookup);
Chris Masona52d9a82007-08-27 16:49:44 -040080 kmem_cache_free(extent_map_cache, em);
81 }
82}
Chris Masona52d9a82007-08-27 16:49:44 -040083
/*
 * Return the exclusive end offset of the range [start, start + len).
 *
 * If start + len would wrap past the top of the u64 space, the result
 * saturates at (u64)-1 instead of wrapping around to a small value.
 */
static u64 range_end(u64 start, u64 len)
{
	u64 end = start + len;

	/* Unsigned addition wrapped iff the sum is below an operand. */
	return end < start ? (u64)-1 : end;
}
91
92static int tree_insert(struct rb_root *root, struct extent_map *em)
Chris Masona52d9a82007-08-27 16:49:44 -040093{
Chris Masond3977122009-01-05 21:25:51 -050094 struct rb_node **p = &root->rb_node;
95 struct rb_node *parent = NULL;
Filipe David Borba Manana32193c12013-11-25 03:23:51 +000096 struct extent_map *entry = NULL;
97 struct rb_node *orig_parent = NULL;
98 u64 end = range_end(em->start, em->len);
Chris Masona52d9a82007-08-27 16:49:44 -040099
Chris Masond3977122009-01-05 21:25:51 -0500100 while (*p) {
Chris Masona52d9a82007-08-27 16:49:44 -0400101 parent = *p;
Chris Masond1310b22008-01-24 16:13:08 -0500102 entry = rb_entry(parent, struct extent_map, rb_node);
103
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000104 if (em->start < entry->start)
Chris Masona52d9a82007-08-27 16:49:44 -0400105 p = &(*p)->rb_left;
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000106 else if (em->start >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -0400107 p = &(*p)->rb_right;
108 else
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000109 return -EEXIST;
Chris Masona52d9a82007-08-27 16:49:44 -0400110 }
111
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000112 orig_parent = parent;
113 while (parent && em->start >= extent_map_end(entry)) {
114 parent = rb_next(parent);
115 entry = rb_entry(parent, struct extent_map, rb_node);
116 }
117 if (parent)
118 if (end > entry->start && em->start < extent_map_end(entry))
119 return -EEXIST;
120
121 parent = orig_parent;
122 entry = rb_entry(parent, struct extent_map, rb_node);
123 while (parent && em->start < entry->start) {
124 parent = rb_prev(parent);
125 entry = rb_entry(parent, struct extent_map, rb_node);
126 }
127 if (parent)
128 if (end > entry->start && em->start < extent_map_end(entry))
129 return -EEXIST;
130
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000131 rb_link_node(&em->rb_node, orig_parent, p);
132 rb_insert_color(&em->rb_node, root);
133 return 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400134}
135
Chris Masond352ac62008-09-29 15:18:18 -0400136/*
137 * search through the tree for an extent_map with a given offset. If
138 * it can't be found, try to find some neighboring extents
139 */
Chris Masona52d9a82007-08-27 16:49:44 -0400140static struct rb_node *__tree_search(struct rb_root *root, u64 offset,
Chris Mason5f564062008-01-22 16:47:59 -0500141 struct rb_node **prev_ret,
142 struct rb_node **next_ret)
Chris Masona52d9a82007-08-27 16:49:44 -0400143{
Chris Masond3977122009-01-05 21:25:51 -0500144 struct rb_node *n = root->rb_node;
Chris Masona52d9a82007-08-27 16:49:44 -0400145 struct rb_node *prev = NULL;
Chris Mason5f564062008-01-22 16:47:59 -0500146 struct rb_node *orig_prev = NULL;
Chris Masond1310b22008-01-24 16:13:08 -0500147 struct extent_map *entry;
148 struct extent_map *prev_entry = NULL;
Chris Masona52d9a82007-08-27 16:49:44 -0400149
Chris Masond3977122009-01-05 21:25:51 -0500150 while (n) {
Chris Masond1310b22008-01-24 16:13:08 -0500151 entry = rb_entry(n, struct extent_map, rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400152 prev = n;
153 prev_entry = entry;
154
155 if (offset < entry->start)
156 n = n->rb_left;
Chris Masond1310b22008-01-24 16:13:08 -0500157 else if (offset >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -0400158 n = n->rb_right;
159 else
160 return n;
161 }
Chris Mason5f564062008-01-22 16:47:59 -0500162
163 if (prev_ret) {
164 orig_prev = prev;
Chris Masond3977122009-01-05 21:25:51 -0500165 while (prev && offset >= extent_map_end(prev_entry)) {
Chris Mason5f564062008-01-22 16:47:59 -0500166 prev = rb_next(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500167 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500168 }
169 *prev_ret = prev;
170 prev = orig_prev;
Chris Masona52d9a82007-08-27 16:49:44 -0400171 }
Chris Mason5f564062008-01-22 16:47:59 -0500172
173 if (next_ret) {
Chris Masond1310b22008-01-24 16:13:08 -0500174 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Masond3977122009-01-05 21:25:51 -0500175 while (prev && offset < prev_entry->start) {
Chris Mason5f564062008-01-22 16:47:59 -0500176 prev = rb_prev(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500177 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500178 }
179 *next_ret = prev;
180 }
Chris Masona52d9a82007-08-27 16:49:44 -0400181 return NULL;
182}
183
Chris Masond352ac62008-09-29 15:18:18 -0400184/* check to see if two extent_map structs are adjacent and safe to merge */
Chris Masond1310b22008-01-24 16:13:08 -0500185static int mergable_maps(struct extent_map *prev, struct extent_map *next)
Chris Masona52d9a82007-08-27 16:49:44 -0400186{
Chris Mason7f3c74f2008-07-18 12:01:11 -0400187 if (test_bit(EXTENT_FLAG_PINNED, &prev->flags))
188 return 0;
189
Chris Masonc8b97812008-10-29 14:49:59 -0400190 /*
191 * don't merge compressed extents, we need to know their
192 * actual size
193 */
194 if (test_bit(EXTENT_FLAG_COMPRESSED, &prev->flags))
195 return 0;
196
Josef Bacik201a9032013-01-24 12:02:07 -0500197 if (test_bit(EXTENT_FLAG_LOGGING, &prev->flags) ||
198 test_bit(EXTENT_FLAG_LOGGING, &next->flags))
199 return 0;
200
Josef Bacik09a2a8f92013-04-05 16:51:15 -0400201 /*
202 * We don't want to merge stuff that hasn't been written to the log yet
203 * since it may not reflect exactly what is on disk, and that would be
204 * bad.
205 */
206 if (!list_empty(&prev->list) || !list_empty(&next->list))
207 return 0;
208
Chris Masond1310b22008-01-24 16:13:08 -0500209 if (extent_map_end(prev) == next->start &&
210 prev->flags == next->flags &&
211 prev->bdev == next->bdev &&
212 ((next->block_start == EXTENT_MAP_HOLE &&
213 prev->block_start == EXTENT_MAP_HOLE) ||
214 (next->block_start == EXTENT_MAP_INLINE &&
215 prev->block_start == EXTENT_MAP_INLINE) ||
216 (next->block_start == EXTENT_MAP_DELALLOC &&
217 prev->block_start == EXTENT_MAP_DELALLOC) ||
218 (next->block_start < EXTENT_MAP_LAST_BYTE - 1 &&
219 next->block_start == extent_map_block_end(prev)))) {
220 return 1;
221 }
Chris Masona52d9a82007-08-27 16:49:44 -0400222 return 0;
223}
224
Li Zefan4d2c8f622011-07-14 03:18:33 +0000225static void try_merge_map(struct extent_map_tree *tree, struct extent_map *em)
Chris Masona1ed8352009-09-11 12:27:37 -0400226{
Chris Masona1ed8352009-09-11 12:27:37 -0400227 struct extent_map *merge = NULL;
228 struct rb_node *rb;
Chris Masona1ed8352009-09-11 12:27:37 -0400229
230 if (em->start != 0) {
231 rb = rb_prev(&em->rb_node);
232 if (rb)
233 merge = rb_entry(rb, struct extent_map, rb_node);
234 if (rb && mergable_maps(merge, em)) {
235 em->start = merge->start;
Josef Bacik70c8a912012-10-11 16:54:30 -0400236 em->orig_start = merge->orig_start;
Chris Masona1ed8352009-09-11 12:27:37 -0400237 em->len += merge->len;
238 em->block_len += merge->block_len;
239 em->block_start = merge->block_start;
Josef Bacik70c8a912012-10-11 16:54:30 -0400240 em->mod_len = (em->mod_len + em->mod_start) - merge->mod_start;
241 em->mod_start = merge->mod_start;
242 em->generation = max(em->generation, merge->generation);
Josef Bacik5dc562c2012-08-17 13:14:17 -0400243
Chris Masona1ed8352009-09-11 12:27:37 -0400244 rb_erase(&merge->rb_node, &tree->map);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000245 RB_CLEAR_NODE(&merge->rb_node);
Chris Masona1ed8352009-09-11 12:27:37 -0400246 free_extent_map(merge);
247 }
248 }
249
250 rb = rb_next(&em->rb_node);
251 if (rb)
252 merge = rb_entry(rb, struct extent_map, rb_node);
253 if (rb && mergable_maps(em, merge)) {
254 em->len += merge->len;
Filipe David Borba Mananad527afe2013-11-30 11:28:35 +0000255 em->block_len += merge->block_len;
Chris Masona1ed8352009-09-11 12:27:37 -0400256 rb_erase(&merge->rb_node, &tree->map);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000257 RB_CLEAR_NODE(&merge->rb_node);
Josef Bacik70c8a912012-10-11 16:54:30 -0400258 em->mod_len = (merge->mod_start + merge->mod_len) - em->mod_start;
259 em->generation = max(em->generation, merge->generation);
Chris Masona1ed8352009-09-11 12:27:37 -0400260 free_extent_map(merge);
261 }
Li Zefan4d2c8f622011-07-14 03:18:33 +0000262}
263
Josef Bacik5dc562c2012-08-17 13:14:17 -0400264/**
Liu Bo52b1de92012-10-30 17:13:52 +0800265 * unpin_extent_cache - unpin an extent from the cache
Josef Bacik5dc562c2012-08-17 13:14:17 -0400266 * @tree: tree to unpin the extent in
267 * @start: logical offset in the file
268 * @len: length of the extent
269 * @gen: generation that this extent has been modified in
Josef Bacik5dc562c2012-08-17 13:14:17 -0400270 *
271 * Called after an extent has been written to disk properly. Set the generation
272 * to the generation that actually added the file item to the inode so we know
273 * we need to sync this extent when we call fsync().
274 */
275int unpin_extent_cache(struct extent_map_tree *tree, u64 start, u64 len,
276 u64 gen)
Li Zefan4d2c8f622011-07-14 03:18:33 +0000277{
278 int ret = 0;
279 struct extent_map *em;
Liu Bo4e2f84e2012-08-27 10:52:20 -0600280 bool prealloc = false;
Li Zefan4d2c8f622011-07-14 03:18:33 +0000281
282 write_lock(&tree->lock);
283 em = lookup_extent_mapping(tree, start, len);
284
285 WARN_ON(!em || em->start != start);
286
287 if (!em)
288 goto out;
289
Josef Bacik5dc562c2012-08-17 13:14:17 -0400290 em->generation = gen;
Li Zefan4d2c8f622011-07-14 03:18:33 +0000291 clear_bit(EXTENT_FLAG_PINNED, &em->flags);
Liu Bo4e2f84e2012-08-27 10:52:20 -0600292 em->mod_start = em->start;
293 em->mod_len = em->len;
294
Josef Bacikb11e2342012-12-03 10:58:15 -0500295 if (test_bit(EXTENT_FLAG_FILLING, &em->flags)) {
Liu Bo4e2f84e2012-08-27 10:52:20 -0600296 prealloc = true;
Josef Bacikb11e2342012-12-03 10:58:15 -0500297 clear_bit(EXTENT_FLAG_FILLING, &em->flags);
Liu Bo4e2f84e2012-08-27 10:52:20 -0600298 }
Li Zefan4d2c8f622011-07-14 03:18:33 +0000299
300 try_merge_map(tree, em);
Liu Bo4e2f84e2012-08-27 10:52:20 -0600301
302 if (prealloc) {
303 em->mod_start = em->start;
304 em->mod_len = em->len;
305 }
306
Chris Masona1ed8352009-09-11 12:27:37 -0400307 free_extent_map(em);
308out:
309 write_unlock(&tree->lock);
310 return ret;
311
312}
313
Josef Bacik201a9032013-01-24 12:02:07 -0500314void clear_em_logging(struct extent_map_tree *tree, struct extent_map *em)
315{
316 clear_bit(EXTENT_FLAG_LOGGING, &em->flags);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000317 if (extent_map_in_tree(em))
Josef Bacik222c81d2013-01-28 09:45:20 -0500318 try_merge_map(tree, em);
Josef Bacik201a9032013-01-24 12:02:07 -0500319}
320
Filipe Manana176840b2014-02-25 14:15:13 +0000321static inline void setup_extent_mapping(struct extent_map_tree *tree,
322 struct extent_map *em,
323 int modified)
324{
Elena Reshetova490b54d2017-03-03 10:55:12 +0200325 refcount_inc(&em->refs);
Filipe Manana176840b2014-02-25 14:15:13 +0000326 em->mod_start = em->start;
327 em->mod_len = em->len;
328
329 if (modified)
330 list_move(&em->list, &tree->modified_extents);
331 else
332 try_merge_map(tree, em);
333}
334
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400335/**
336 * add_extent_mapping - add new extent map to the extent tree
337 * @tree: tree to insert new map in
338 * @em: map to insert
339 *
340 * Insert @em into @tree or perform a simple forward/backward merge with
341 * existing mappings. The extent_map struct passed in will be inserted
342 * into the tree directly, with an additional reference taken, or a
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300343 * reference dropped if the merge attempt was successful.
Chris Masona52d9a82007-08-27 16:49:44 -0400344 */
345int add_extent_mapping(struct extent_map_tree *tree,
Josef Bacik09a2a8f92013-04-05 16:51:15 -0400346 struct extent_map *em, int modified)
Chris Masona52d9a82007-08-27 16:49:44 -0400347{
348 int ret = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400349
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000350 ret = tree_insert(&tree->map, em);
351 if (ret)
Chris Mason7c2fe322008-08-20 08:51:50 -0400352 goto out;
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000353
Filipe Manana176840b2014-02-25 14:15:13 +0000354 setup_extent_mapping(tree, em, modified);
Chris Masona52d9a82007-08-27 16:49:44 -0400355out:
Chris Masona52d9a82007-08-27 16:49:44 -0400356 return ret;
357}
Chris Masona52d9a82007-08-27 16:49:44 -0400358
Eric Sandeen48a3b632013-04-25 20:41:01 +0000359static struct extent_map *
360__lookup_extent_mapping(struct extent_map_tree *tree,
361 u64 start, u64 len, int strict)
Li Zefaned64f062011-07-14 03:18:15 +0000362{
363 struct extent_map *em;
364 struct rb_node *rb_node;
365 struct rb_node *prev = NULL;
366 struct rb_node *next = NULL;
367 u64 end = range_end(start, len);
368
369 rb_node = __tree_search(&tree->map, start, &prev, &next);
370 if (!rb_node) {
371 if (prev)
372 rb_node = prev;
373 else if (next)
374 rb_node = next;
375 else
376 return NULL;
377 }
378
379 em = rb_entry(rb_node, struct extent_map, rb_node);
380
381 if (strict && !(end > em->start && start < extent_map_end(em)))
382 return NULL;
383
Elena Reshetova490b54d2017-03-03 10:55:12 +0200384 refcount_inc(&em->refs);
Li Zefaned64f062011-07-14 03:18:15 +0000385 return em;
386}
387
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400388/**
389 * lookup_extent_mapping - lookup extent_map
390 * @tree: tree to lookup in
391 * @start: byte offset to start the search
392 * @len: length of the lookup range
393 *
394 * Find and return the first extent_map struct in @tree that intersects the
395 * [start, len] range. There may be additional objects in the tree that
396 * intersect, so check the object returned carefully to make sure that no
397 * additional lookups are needed.
Chris Masona52d9a82007-08-27 16:49:44 -0400398 */
399struct extent_map *lookup_extent_mapping(struct extent_map_tree *tree,
Chris Masond1310b22008-01-24 16:13:08 -0500400 u64 start, u64 len)
Chris Masona52d9a82007-08-27 16:49:44 -0400401{
Li Zefaned64f062011-07-14 03:18:15 +0000402 return __lookup_extent_mapping(tree, start, len, 1);
Chris Masona52d9a82007-08-27 16:49:44 -0400403}
Chris Masona52d9a82007-08-27 16:49:44 -0400404
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400405/**
Chris Masonb917b7c2009-09-18 16:07:03 -0400406 * search_extent_mapping - find a nearby extent map
407 * @tree: tree to lookup in
408 * @start: byte offset to start the search
409 * @len: length of the lookup range
410 *
411 * Find and return the first extent_map struct in @tree that intersects the
412 * [start, len] range.
413 *
414 * If one can't be found, any nearby extent may be returned
415 */
416struct extent_map *search_extent_mapping(struct extent_map_tree *tree,
417 u64 start, u64 len)
418{
Li Zefaned64f062011-07-14 03:18:15 +0000419 return __lookup_extent_mapping(tree, start, len, 0);
Chris Masonb917b7c2009-09-18 16:07:03 -0400420}
421
422/**
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400423 * remove_extent_mapping - removes an extent_map from the extent tree
424 * @tree: extent tree to remove from
Adam Buchbinderbb7ab3b2016-03-04 11:23:12 -0800425 * @em: extent map being removed
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400426 *
427 * Removes @em from @tree. No reference counts are dropped, and no checks
428 * are done to see if the range is in use
Chris Masona52d9a82007-08-27 16:49:44 -0400429 */
430int remove_extent_mapping(struct extent_map_tree *tree, struct extent_map *em)
431{
Chris Masond1310b22008-01-24 16:13:08 -0500432 int ret = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400433
Chris Mason7f3c74f2008-07-18 12:01:11 -0400434 WARN_ON(test_bit(EXTENT_FLAG_PINNED, &em->flags));
Chris Masond1310b22008-01-24 16:13:08 -0500435 rb_erase(&em->rb_node, &tree->map);
Josef Bacikff44c6e2012-09-14 12:59:20 -0400436 if (!test_bit(EXTENT_FLAG_LOGGING, &em->flags))
437 list_del_init(&em->list);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000438 RB_CLEAR_NODE(&em->rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400439 return ret;
440}
Filipe Manana176840b2014-02-25 14:15:13 +0000441
442void replace_extent_mapping(struct extent_map_tree *tree,
443 struct extent_map *cur,
444 struct extent_map *new,
445 int modified)
446{
447 WARN_ON(test_bit(EXTENT_FLAG_PINNED, &cur->flags));
448 ASSERT(extent_map_in_tree(cur));
449 if (!test_bit(EXTENT_FLAG_LOGGING, &cur->flags))
450 list_del_init(&cur->list);
451 rb_replace_node(&cur->rb_node, &new->rb_node, &tree->map);
452 RB_CLEAR_NODE(&cur->rb_node);
453
454 setup_extent_mapping(tree, new, modified);
455}
Liu Boc04e61b2018-01-05 12:51:11 -0700456
457static struct extent_map *next_extent_map(struct extent_map *em)
458{
459 struct rb_node *next;
460
461 next = rb_next(&em->rb_node);
462 if (!next)
463 return NULL;
464 return container_of(next, struct extent_map, rb_node);
465}
466
467static struct extent_map *prev_extent_map(struct extent_map *em)
468{
469 struct rb_node *prev;
470
471 prev = rb_prev(&em->rb_node);
472 if (!prev)
473 return NULL;
474 return container_of(prev, struct extent_map, rb_node);
475}
476
477/* helper for btfs_get_extent. Given an existing extent in the tree,
478 * the existing extent is the nearest extent to map_start,
479 * and an extent that you want to insert, deal with overlap and insert
480 * the best fitted new extent into the tree.
481 */
Liu Bo5f4791f2018-01-05 12:51:17 -0700482static noinline int merge_extent_mapping(struct extent_map_tree *em_tree,
483 struct extent_map *existing,
484 struct extent_map *em,
485 u64 map_start)
Liu Boc04e61b2018-01-05 12:51:11 -0700486{
487 struct extent_map *prev;
488 struct extent_map *next;
489 u64 start;
490 u64 end;
491 u64 start_diff;
492
493 BUG_ON(map_start < em->start || map_start >= extent_map_end(em));
494
495 if (existing->start > map_start) {
496 next = existing;
497 prev = prev_extent_map(next);
498 } else {
499 prev = existing;
500 next = next_extent_map(prev);
501 }
502
503 start = prev ? extent_map_end(prev) : em->start;
504 start = max_t(u64, start, em->start);
505 end = next ? next->start : extent_map_end(em);
506 end = min_t(u64, end, extent_map_end(em));
507 start_diff = start - em->start;
508 em->start = start;
509 em->len = end - start;
510 if (em->block_start < EXTENT_MAP_LAST_BYTE &&
511 !test_bit(EXTENT_FLAG_COMPRESSED, &em->flags)) {
512 em->block_start += start_diff;
513 em->block_len = em->len;
514 }
515 return add_extent_mapping(em_tree, em, 0);
516}
517
518/**
519 * btrfs_add_extent_mapping - add extent mapping into em_tree
520 * @em_tree - the extent tree into which we want to insert the extent mapping
521 * @em_in - extent we are inserting
522 * @start - start of the logical range btrfs_get_extent() is requesting
523 * @len - length of the logical range btrfs_get_extent() is requesting
524 *
525 * Note that @em_in's range may be different from [start, start+len),
526 * but they must be overlapped.
527 *
528 * Insert @em_in into @em_tree. In case there is an overlapping range, handle
529 * the -EEXIST by either:
530 * a) Returning the existing extent in @em_in if @start is within the
531 * existing em.
532 * b) Merge the existing extent with @em_in passed in.
533 *
534 * Return 0 on success, otherwise -EEXIST.
535 *
536 */
537int btrfs_add_extent_mapping(struct extent_map_tree *em_tree,
538 struct extent_map **em_in, u64 start, u64 len)
539{
540 int ret;
541 struct extent_map *em = *em_in;
542
543 ret = add_extent_mapping(em_tree, em, 0);
544 /* it is possible that someone inserted the extent into the tree
545 * while we had the lock dropped. It is also possible that
546 * an overlapping map exists in the tree
547 */
548 if (ret == -EEXIST) {
549 struct extent_map *existing;
550
551 ret = 0;
552
553 existing = search_extent_mapping(em_tree, start, len);
Liu Bo393da912018-01-05 12:51:16 -0700554
555 trace_btrfs_handle_em_exist(existing, em, start, len);
556
Liu Boc04e61b2018-01-05 12:51:11 -0700557 /*
558 * existing will always be non-NULL, since there must be
559 * extent causing the -EEXIST.
560 */
561 if (start >= existing->start &&
562 start < extent_map_end(existing)) {
563 free_extent_map(em);
564 *em_in = existing;
565 ret = 0;
566 } else {
Liu Bo9a7e10e2018-01-05 12:51:15 -0700567 u64 orig_start = em->start;
568 u64 orig_len = em->len;
569
Liu Boc04e61b2018-01-05 12:51:11 -0700570 /*
571 * The existing extent map is the one nearest to
572 * the [start, start + len) range which overlaps
573 */
574 ret = merge_extent_mapping(em_tree, existing,
575 em, start);
Liu Boc04e61b2018-01-05 12:51:11 -0700576 if (ret) {
577 free_extent_map(em);
578 *em_in = NULL;
Liu Bo9a7e10e2018-01-05 12:51:15 -0700579 WARN_ONCE(ret,
580"unexpected error %d: merge existing(start %llu len %llu) with em(start %llu len %llu)\n",
581 ret, existing->start, existing->len,
582 orig_start, orig_len);
Liu Boc04e61b2018-01-05 12:51:11 -0700583 }
Liu Bo9a7e10e2018-01-05 12:51:15 -0700584 free_extent_map(existing);
Liu Boc04e61b2018-01-05 12:51:11 -0700585 }
586 }
587
588 ASSERT(ret == 0 || ret == -EEXIST);
589 return ret;
590}