Commit 5d659bbb authored by Sidhartha Kumar, committed by Andrew Morton

maple_tree: introduce mas_wr_store_type()

Introduce mas_wr_store_type() which will set the correct store type based
on a walk of the tree.  In mas_wr_node_store() the <= min_slots condition
is changed to <, because if new_end is equal to mt_min_slots then there is
not enough room.

mas_prealloc_calc() is also introduced to abstract the calculation used to
determine the number of nodes needed for a store operation.

In this change a call to mas_reset() is removed in the error case of
mas_preallocate().  This is only needed in the MA_STATE_REBALANCE case of
mas_destroy().  We can move the call to mas_reset() directly to
mas_destroy().

Also, add a test case to validate the order that we check the store type
in is correct.  This test models a vma expanding and then shrinking which
is part of the boot process.

Link: https://lkml.kernel.org/r/20240814161944.55347-5-sidhartha.kumar@oracle.com
Signed-off-by: Sidhartha Kumar <sidhartha.kumar@oracle.com>
Cc: Liam R. Howlett <Liam.Howlett@oracle.com>
Cc: Matthew Wilcox (Oracle) <willy@infradead.org>
Cc: Suren Baghdasaryan <surenb@google.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
parent 3cc6f42a
...@@ -1372,9 +1372,9 @@ static inline struct maple_enode *mas_start(struct ma_state *mas) ...@@ -1372,9 +1372,9 @@ static inline struct maple_enode *mas_start(struct ma_state *mas)
return NULL; return NULL;
} }
mas->node = NULL;
/* empty tree */ /* empty tree */
if (unlikely(!root)) { if (unlikely(!root)) {
mas->node = NULL;
mas->status = ma_none; mas->status = ma_none;
mas->offset = MAPLE_NODE_SLOTS; mas->offset = MAPLE_NODE_SLOTS;
return NULL; return NULL;
...@@ -3890,7 +3890,7 @@ static inline bool mas_wr_node_store(struct ma_wr_state *wr_mas, ...@@ -3890,7 +3890,7 @@ static inline bool mas_wr_node_store(struct ma_wr_state *wr_mas,
bool in_rcu = mt_in_rcu(mas->tree); bool in_rcu = mt_in_rcu(mas->tree);
/* Check if there is enough data. The room is enough. */ /* Check if there is enough data. The room is enough. */
if (!mte_is_root(mas->node) && (new_end <= mt_min_slots[wr_mas->type]) && if (!mte_is_root(mas->node) && (new_end < mt_min_slots[wr_mas->type]) &&
!(mas->mas_flags & MA_STATE_BULK)) !(mas->mas_flags & MA_STATE_BULK))
return false; return false;
...@@ -4275,6 +4275,146 @@ static inline void mas_wr_prealloc_setup(struct ma_wr_state *wr_mas) ...@@ -4275,6 +4275,146 @@ static inline void mas_wr_prealloc_setup(struct ma_wr_state *wr_mas)
wr_mas->content = mas_start(mas); wr_mas->content = mas_start(mas);
} }
/**
 * mas_prealloc_calc() - Calculate number of nodes needed for a
 * given store operation
 * @mas: The maple state
 * @entry: The entry to store into the tree
 *
 * The estimate is selected by mas->store_type; the tree height, the RCU
 * mode of the tree, the stored range and @entry refine it for some types.
 *
 * Return: Number of nodes required for preallocation.
 */
static inline int mas_prealloc_calc(struct ma_state *mas, void *entry)
{
	/* Start from the spanning-store estimate; wr_invalid keeps it as-is. */
	int nodes = mas_mt_height(mas) * 3 + 1;

	switch (mas->store_type) {
	case wr_exact_fit:
	case wr_append:
	case wr_slot_store:
		/* These store types request no nodes. */
		nodes = 0;
		break;
	case wr_node_store:
		/* One node is requested only when the tree is in RCU mode. */
		if (mt_in_rcu(mas->tree))
			nodes = 1;
		else
			nodes = 0;
		break;
	case wr_new_root:
		nodes = 1;
		break;
	case wr_store_root:
		/*
		 * Only a store to the single index 0 can avoid a node, and
		 * only when the low two bits of @entry are not 0b10.
		 * NOTE(review): that bit pattern looks like the tag used for
		 * internal node pointers - confirm.
		 */
		if (mas->index || mas->last ||
		    ((unsigned long)entry & 3) == 2)
			nodes = 1;
		else
			nodes = 0;
		break;
	case wr_rebalance:
		nodes = mas_mt_height(mas) * 2 - 1;
		break;
	case wr_split_store:
		nodes = mas_mt_height(mas) * 2 + 1;
		break;
	case wr_spanning_store:
		nodes = mas_mt_height(mas) * 3 + 1;
		break;
	case wr_invalid:
		WARN_ON_ONCE(1);
		break;
	}

	return nodes;
}
/*
* mas_wr_store_type() - Set the store type for a given
* store operation.
* @wr_mas: The maple write state
*/
static inline void mas_wr_store_type(struct ma_wr_state *wr_mas)
{
struct ma_state *mas = wr_mas->mas;
unsigned char new_end;
if (unlikely(mas_is_none(mas) || mas_is_ptr(mas))) {
mas->store_type = wr_store_root;
return;
}
if (unlikely(!mas_wr_walk(wr_mas))) {
mas->store_type = wr_spanning_store;
return;
}
/* At this point, we are at the leaf node that needs to be altered. */
mas_wr_end_piv(wr_mas);
if (!wr_mas->entry)
mas_wr_extend_null(wr_mas);
new_end = mas_wr_new_end(wr_mas);
if ((wr_mas->r_min == mas->index) && (wr_mas->r_max == mas->last)) {
mas->store_type = wr_exact_fit;
return;
}
if (unlikely(!mas->index && mas->last == ULONG_MAX)) {
mas->store_type = wr_new_root;
return;
}
/* Potential spanning rebalance collapsing a node */
if (new_end < mt_min_slots[wr_mas->type]) {
if (!mte_is_root(mas->node)) {
mas->store_type = wr_rebalance;
return;
}
mas->store_type = wr_node_store;
return;
}
if (new_end >= mt_slots[wr_mas->type]) {
mas->store_type = wr_split_store;
return;
}
if (!mt_in_rcu(mas->tree) && (mas->offset == mas->end)) {
mas->store_type = wr_append;
return;
}
if ((new_end == mas->end) && (!mt_in_rcu(mas->tree) ||
(wr_mas->offset_end - mas->offset == 1))) {
mas->store_type = wr_slot_store;
return;
}
if (mte_is_root(mas->node) || (new_end >= mt_min_slots[wr_mas->type]) ||
(mas->mas_flags & MA_STATE_BULK)) {
mas->store_type = wr_node_store;
return;
}
mas->store_type = wr_invalid;
MAS_WARN_ON(mas, 1);
}
/**
 * mas_wr_preallocate() - Preallocate enough nodes for a store operation
 * @wr_mas: The maple write state
 * @entry: The entry that will be stored
 *
 * Sets up the write state, determines the store type and then requests
 * the number of nodes reported by mas_prealloc_calc().  No request is
 * made when that number is zero.
 */
static inline void mas_wr_preallocate(struct ma_wr_state *wr_mas, void *entry)
{
	struct ma_state *mas = wr_mas->mas;
	int nodes_needed;

	mas_wr_prealloc_setup(wr_mas);
	mas_wr_store_type(wr_mas);

	nodes_needed = mas_prealloc_calc(mas, entry);
	if (nodes_needed)
		mas_node_count(mas, nodes_needed);
}
/** /**
* mas_insert() - Internal call to insert a value * mas_insert() - Internal call to insert a value
* @mas: The maple state * @mas: The maple state
...@@ -5508,69 +5648,25 @@ EXPORT_SYMBOL_GPL(mas_store_prealloc); ...@@ -5508,69 +5648,25 @@ EXPORT_SYMBOL_GPL(mas_store_prealloc);
int mas_preallocate(struct ma_state *mas, void *entry, gfp_t gfp) int mas_preallocate(struct ma_state *mas, void *entry, gfp_t gfp)
{ {
MA_WR_STATE(wr_mas, mas, entry); MA_WR_STATE(wr_mas, mas, entry);
unsigned char node_size; int ret = 0;
int request = 1; int request;
int ret;
if (unlikely(!mas->index && mas->last == ULONG_MAX))
goto ask_now;
mas_wr_prealloc_setup(&wr_mas); mas_wr_prealloc_setup(&wr_mas);
/* Root expand */ mas_wr_store_type(&wr_mas);
if (unlikely(mas_is_none(mas) || mas_is_ptr(mas))) request = mas_prealloc_calc(mas, entry);
goto ask_now; if (!request)
return ret;
if (unlikely(!mas_wr_walk(&wr_mas))) {
/* Spanning store, use worst case for now */
request = 1 + mas_mt_height(mas) * 3;
goto ask_now;
}
/* At this point, we are at the leaf node that needs to be altered. */
/* Exact fit, no nodes needed. */
if (wr_mas.r_min == mas->index && wr_mas.r_max == mas->last)
return 0;
mas_wr_end_piv(&wr_mas);
node_size = mas_wr_new_end(&wr_mas);
/* Slot store, does not require additional nodes */
if (node_size == mas->end) {
/* reuse node */
if (!mt_in_rcu(mas->tree))
return 0;
/* shifting boundary */
if (wr_mas.offset_end - mas->offset == 1)
return 0;
}
if (node_size >= mt_slots[wr_mas.type]) { mas_node_count_gfp(mas, request, gfp);
/* Split, worst case for now. */ if (mas_is_err(mas)) {
request = 1 + mas_mt_height(mas) * 2; mas_set_alloc_req(mas, 0);
goto ask_now; ret = xa_err(mas->node);
mas_destroy(mas);
mas_reset(mas);
return ret;
} }
/* New root needs a single node */
if (unlikely(mte_is_root(mas->node)))
goto ask_now;
/* Potential spanning rebalance collapsing a node, use worst-case */
if (node_size - 1 <= mt_min_slots[wr_mas.type])
request = mas_mt_height(mas) * 2 - 1;
/* node store, slot store needs one node */
ask_now:
mas_node_count_gfp(mas, request, gfp);
mas->mas_flags |= MA_STATE_PREALLOC; mas->mas_flags |= MA_STATE_PREALLOC;
if (likely(!mas_is_err(mas)))
return 0;
mas_set_alloc_req(mas, 0);
ret = xa_err(mas->node);
mas_reset(mas);
mas_destroy(mas);
mas_reset(mas);
return ret; return ret;
} }
EXPORT_SYMBOL_GPL(mas_preallocate); EXPORT_SYMBOL_GPL(mas_preallocate);
...@@ -5596,7 +5692,8 @@ void mas_destroy(struct ma_state *mas) ...@@ -5596,7 +5692,8 @@ void mas_destroy(struct ma_state *mas)
*/ */
if (mas->mas_flags & MA_STATE_REBALANCE) { if (mas->mas_flags & MA_STATE_REBALANCE) {
unsigned char end; unsigned char end;
if (mas_is_err(mas))
mas_reset(mas);
mas_start(mas); mas_start(mas);
mtree_range_walk(mas); mtree_range_walk(mas);
end = mas->end + 1; end = mas->end + 1;
......
...@@ -36283,6 +36283,38 @@ static void check_nomem_writer_race(struct maple_tree *mt) ...@@ -36283,6 +36283,38 @@ static void check_nomem_writer_race(struct maple_tree *mt)
mtree_unlock(mt); mtree_unlock(mt);
} }
/*
 * Test to simulate expanding a vma from [0x7fffffffe000, 0x7ffffffff000)
 * to [0x7ffde4ca1000, 0x7ffffffff000) and then shrinking the vma to
 * [0x7ffde4ca1000, 0x7ffde4ca2000).
 *
 * Every step is a mas_preallocate() followed by mas_store_prealloc() on the
 * same range, performed between mtree_lock() and mtree_unlock().  The return
 * values of mas_preallocate() are not checked.
 *
 * Return: always 0.
 */
static inline int check_vma_modification(struct maple_tree *mt)
{
MA_STATE(mas, mt, 0, 0);
mtree_lock(mt);
/* vma with old start and old end */
__mas_set_range(&mas, 0x7fffffffe000, 0x7ffffffff000 - 1);
mas_preallocate(&mas, xa_mk_value(1), GFP_KERNEL);
mas_store_prealloc(&mas, xa_mk_value(1));
/* next write occurs partly in previous range [0, 0x7fffffffe000) */
mas_prev_range(&mas, 0);
/* expand vma to [0x7ffde4ca1000, 0x7ffffffff000) */
__mas_set_range(&mas, 0x7ffde4ca1000, 0x7ffffffff000 - 1);
mas_preallocate(&mas, xa_mk_value(1), GFP_KERNEL);
mas_store_prealloc(&mas, xa_mk_value(1));
/*
 * shrink vma to [0x7ffde4ca1000, 0x7ffde4ca2000) by storing NULL over
 * the tail [0x7ffde4ca2000, 0x7ffffffff000)
 */
__mas_set_range(&mas, 0x7ffde4ca2000, 0x7ffffffff000 - 1);
mas_preallocate(&mas, NULL, GFP_KERNEL);
mas_store_prealloc(&mas, NULL);
/* dump the resulting tree in hex format */
mt_dump(mt, mt_dump_hex);
mas_destroy(&mas);
mtree_unlock(mt);
return 0;
}
void farmer_tests(void) void farmer_tests(void)
{ {
struct maple_node *node; struct maple_node *node;
...@@ -36290,6 +36322,10 @@ void farmer_tests(void) ...@@ -36290,6 +36322,10 @@ void farmer_tests(void)
mt_dump(&tree, mt_dump_dec); mt_dump(&tree, mt_dump_dec);
mt_init_flags(&tree, MT_FLAGS_ALLOC_RANGE | MT_FLAGS_LOCK_EXTERN | MT_FLAGS_USE_RCU);
check_vma_modification(&tree);
mtree_destroy(&tree);
tree.ma_root = xa_mk_value(0); tree.ma_root = xa_mk_value(0);
mt_dump(&tree, mt_dump_dec); mt_dump(&tree, mt_dump_dec);
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment