rust: rbtree: add RBTree::entry

This mirrors the entry API [1] from the Rust standard library on
`RBTree`. This API can be used to access the entry at a specific key and
make modifications depending on whether the key is vacant or occupied.
This API is useful because it can often be used to avoid traversing the
tree multiple times.

This is used by binder to look up and conditionally access or insert a
value, depending on whether it is there or not [2].

Link: https://doc.rust-lang.org/stable/std/collections/btree_map/enum.Entry.html [1]
Link: https://android-review.googlesource.com/c/kernel/common/+/2849906 [2]
Signed-off-by: Alice Ryhl <aliceryhl@google.com>
Tested-by: Alice Ryhl <aliceryhl@google.com>
Reviewed-by: Boqun Feng <boqun.feng@gmail.com>
Reviewed-by: Benno Lossin <benno.lossin@proton.me>
Signed-off-by: Matt Gilbride <mattgilbride@google.com>
Link: https://lore.kernel.org/r/20240822-b4-rbtree-v12-5-014561758a57@google.com
Signed-off-by: Miguel Ojeda <ojeda@kernel.org>
This commit is contained in:
Alice Ryhl 2024-08-22 16:37:57 +00:00 committed by Miguel Ojeda
parent 98c14e40e0
commit a335e95914

View File

@ -293,12 +293,19 @@ where
/// key/value pair). Returns [`None`] if a node with the same key didn't already exist. /// key/value pair). Returns [`None`] if a node with the same key didn't already exist.
/// ///
/// This function always succeeds. /// This function always succeeds.
pub fn insert(&mut self, RBTreeNode { node }: RBTreeNode<K, V>) -> Option<RBTreeNode<K, V>> { pub fn insert(&mut self, node: RBTreeNode<K, V>) -> Option<RBTreeNode<K, V>> {
let node = Box::into_raw(node); match self.raw_entry(&node.node.key) {
// SAFETY: `node` is valid at least until we call `Box::from_raw`, which only happens when RawEntry::Occupied(entry) => Some(entry.replace(node)),
// the node is removed or replaced. RawEntry::Vacant(entry) => {
let node_links = unsafe { addr_of_mut!((*node).links) }; entry.insert(node);
None
}
}
}
fn raw_entry(&mut self, key: &K) -> RawEntry<'_, K, V> {
let raw_self: *mut RBTree<K, V> = self;
// The returned `RawEntry` is used to call either `rb_link_node` or `rb_replace_node`.
// The parameters of `bindings::rb_link_node` are as follows: // The parameters of `bindings::rb_link_node` are as follows:
// - `node`: A pointer to an uninitialized node being inserted. // - `node`: A pointer to an uninitialized node being inserted.
// - `parent`: A pointer to an existing node in the tree. One of its child pointers must be // - `parent`: A pointer to an existing node in the tree. One of its child pointers must be
@ -317,62 +324,56 @@ where
// in the subtree of `parent` that `child_field_of_parent` points at. Once // in the subtree of `parent` that `child_field_of_parent` points at. Once
// we find an empty subtree, we can insert the new node using `rb_link_node`. // we find an empty subtree, we can insert the new node using `rb_link_node`.
let mut parent = core::ptr::null_mut(); let mut parent = core::ptr::null_mut();
let mut child_field_of_parent: &mut *mut bindings::rb_node = &mut self.root.rb_node; let mut child_field_of_parent: &mut *mut bindings::rb_node =
while !child_field_of_parent.is_null() { // SAFETY: `raw_self` is a valid pointer to the `RBTree` (created from `self` above).
parent = *child_field_of_parent; unsafe { &mut (*raw_self).root.rb_node };
while !(*child_field_of_parent).is_null() {
let curr = *child_field_of_parent;
// SAFETY: All links fields we create are in a `Node<K, V>`.
let node = unsafe { container_of!(curr, Node<K, V>, links) };
// We need to determine whether `node` should be the left or right child of `parent`, // SAFETY: `node` is a non-null node so it is valid by the type invariants.
// so we will compare with the `key` field of `parent` a.k.a. `this` below. match key.cmp(unsafe { &(*node).key }) {
// // SAFETY: `curr` is a non-null node so it is valid by the type invariants.
// SAFETY: By the type invariant of `Self`, all non-null `rb_node` pointers stored in `self` Ordering::Less => child_field_of_parent = unsafe { &mut (*curr).rb_left },
// point to the links field of `Node<K, V>` objects. // SAFETY: `curr` is a non-null node so it is valid by the type invariants.
let this = unsafe { container_of!(parent, Node<K, V>, links) }; Ordering::Greater => child_field_of_parent = unsafe { &mut (*curr).rb_right },
// SAFETY: `this` is a non-null node so it is valid by the type invariants. `node` is
// valid until the node is removed.
match unsafe { (*node).key.cmp(&(*this).key) } {
// We would like `node` to be the left child of `parent`. Move to this child to check
// whether we can use it, or continue searching, at the next iteration.
//
// SAFETY: `parent` is a non-null node so it is valid by the type invariants.
Ordering::Less => child_field_of_parent = unsafe { &mut (*parent).rb_left },
// We would like `node` to be the right child of `parent`. Move to this child to check
// whether we can use it, or continue searching, at the next iteration.
//
// SAFETY: `parent` is a non-null node so it is valid by the type invariants.
Ordering::Greater => child_field_of_parent = unsafe { &mut (*parent).rb_right },
Ordering::Equal => { Ordering::Equal => {
// There is an existing node in the tree with this key, and that node is return RawEntry::Occupied(OccupiedEntry {
// `parent`. Thus, we are replacing parent with a new node. rbtree: self,
// node_links: curr,
// INVARIANT: We are replacing an existing node with a new one, which is valid. })
// It remains valid because we "forgot" it with `Box::into_raw`.
// SAFETY: All pointers are non-null and valid.
unsafe { bindings::rb_replace_node(parent, node_links, &mut self.root) };
// INVARIANT: The node is being returned and the caller may free it, however,
// it was removed from the tree. So the invariants still hold.
return Some(RBTreeNode {
// SAFETY: `this` was a node in the tree, so it is valid.
node: unsafe { Box::from_raw(this.cast_mut()) },
});
} }
} }
parent = curr;
} }
// INVARIANT: We are linking in a new node, which is valid. It remains valid because we RawEntry::Vacant(RawVacantEntry {
// "forgot" it with `Box::into_raw`. rbtree: raw_self,
// SAFETY: All pointers are non-null and valid (`*child_field_of_parent` is null, but `child_field_of_parent` is a parent,
// mutable reference). child_field_of_parent,
unsafe { bindings::rb_link_node(node_links, parent, child_field_of_parent) }; _phantom: PhantomData,
})
// SAFETY: All pointers are valid. `node` has just been inserted into the tree.
unsafe { bindings::rb_insert_color(node_links, &mut self.root) };
None
} }
/// Returns a node with the given key, if one exists. /// Gets the given key's corresponding entry in the map for in-place manipulation.
fn find(&self, key: &K) -> Option<NonNull<Node<K, V>>> { pub fn entry(&mut self, key: K) -> Entry<'_, K, V> {
match self.raw_entry(&key) {
RawEntry::Occupied(entry) => Entry::Occupied(entry),
RawEntry::Vacant(entry) => Entry::Vacant(VacantEntry { raw: entry, key }),
}
}
/// Used for accessing the given node, if it exists.
pub fn find_mut(&mut self, key: &K) -> Option<OccupiedEntry<'_, K, V>> {
match self.raw_entry(key) {
RawEntry::Occupied(entry) => Some(entry),
RawEntry::Vacant(_entry) => None,
}
}
/// Returns a reference to the value corresponding to the key.
pub fn get(&self, key: &K) -> Option<&V> {
let mut node = self.root.rb_node; let mut node = self.root.rb_node;
while !node.is_null() { while !node.is_null() {
// SAFETY: By the type invariant of `Self`, all non-null `rb_node` pointers stored in `self` // SAFETY: By the type invariant of `Self`, all non-null `rb_node` pointers stored in `self`
@ -384,47 +385,30 @@ where
Ordering::Less => unsafe { (*node).rb_left }, Ordering::Less => unsafe { (*node).rb_left },
// SAFETY: `node` is a non-null node so it is valid by the type invariants. // SAFETY: `node` is a non-null node so it is valid by the type invariants.
Ordering::Greater => unsafe { (*node).rb_right }, Ordering::Greater => unsafe { (*node).rb_right },
Ordering::Equal => return NonNull::new(this.cast_mut()), // SAFETY: `node` is a non-null node so it is valid by the type invariants.
Ordering::Equal => return Some(unsafe { &(*this).value }),
} }
} }
None None
} }
/// Returns a reference to the value corresponding to the key.
pub fn get(&self, key: &K) -> Option<&V> {
// SAFETY: The `find` return value is a node in the tree, so it is valid.
self.find(key).map(|node| unsafe { &node.as_ref().value })
}
/// Returns a mutable reference to the value corresponding to the key. /// Returns a mutable reference to the value corresponding to the key.
pub fn get_mut(&mut self, key: &K) -> Option<&mut V> { pub fn get_mut(&mut self, key: &K) -> Option<&mut V> {
// SAFETY: The `find` return value is a node in the tree, so it is valid. self.find_mut(key).map(|node| node.into_mut())
self.find(key)
.map(|mut node| unsafe { &mut node.as_mut().value })
} }
/// Removes the node with the given key from the tree. /// Removes the node with the given key from the tree.
/// ///
/// It returns the node that was removed if one exists, or [`None`] otherwise. /// It returns the node that was removed if one exists, or [`None`] otherwise.
fn remove_node(&mut self, key: &K) -> Option<RBTreeNode<K, V>> { pub fn remove_node(&mut self, key: &K) -> Option<RBTreeNode<K, V>> {
let mut node = self.find(key)?; self.find_mut(key).map(OccupiedEntry::remove_node)
// SAFETY: The `find` return value is a node in the tree, so it is valid.
unsafe { bindings::rb_erase(&mut node.as_mut().links, &mut self.root) };
// INVARIANT: The node is being returned and the caller may free it, however, it was
// removed from the tree. So the invariants still hold.
Some(RBTreeNode {
// SAFETY: The `find` return value was a node in the tree, so it is valid.
node: unsafe { Box::from_raw(node.as_ptr()) },
})
} }
/// Removes the node with the given key from the tree. /// Removes the node with the given key from the tree.
/// ///
/// It returns the value that was removed if one exists, or [`None`] otherwise. /// It returns the value that was removed if one exists, or [`None`] otherwise.
pub fn remove(&mut self, key: &K) -> Option<V> { pub fn remove(&mut self, key: &K) -> Option<V> {
self.remove_node(key).map(|node| node.node.value) self.find_mut(key).map(OccupiedEntry::remove)
} }
/// Returns a cursor over the tree nodes based on the given key. /// Returns a cursor over the tree nodes based on the given key.
@ -1117,6 +1101,177 @@ unsafe impl<K: Send, V: Send> Send for RBTreeNode<K, V> {}
// [`RBTreeNode`] without synchronization. // [`RBTreeNode`] without synchronization.
unsafe impl<K: Sync, V: Sync> Sync for RBTreeNode<K, V> {} unsafe impl<K: Sync, V: Sync> Sync for RBTreeNode<K, V> {}
impl<K, V> RBTreeNode<K, V> {
/// Drop the key and value, but keep the allocation.
///
/// It then becomes a reservation that can be re-initialised into a different node (i.e., with
/// a different key and/or value).
///
/// The existing key and value are dropped in-place as part of this operation, that is, memory
/// may be freed (but only for the key/value; memory for the node itself is kept for reuse).
pub fn into_reservation(self) -> RBTreeNodeReservation<K, V> {
RBTreeNodeReservation {
node: Box::drop_contents(self.node),
}
}
}
/// A view into a single entry in a map, which may either be vacant or occupied.
///
/// This enum is constructed from the [`RBTree::entry`].
///
/// [`entry`]: fn@RBTree::entry
pub enum Entry<'a, K, V> {
/// This [`RBTree`] does not have a node with this key.
Vacant(VacantEntry<'a, K, V>),
/// This [`RBTree`] already has a node with this key.
Occupied(OccupiedEntry<'a, K, V>),
}
/// Like [`Entry`], except that it doesn't have ownership of the key.
enum RawEntry<'a, K, V> {
Vacant(RawVacantEntry<'a, K, V>),
Occupied(OccupiedEntry<'a, K, V>),
}
/// A view into a vacant entry in a [`RBTree`]. It is part of the [`Entry`] enum.
pub struct VacantEntry<'a, K, V> {
key: K,
raw: RawVacantEntry<'a, K, V>,
}
/// Like [`VacantEntry`], but doesn't hold on to the key.
///
/// # Invariants
/// - `parent` may be null if the new node becomes the root.
/// - `child_field_of_parent` is a valid pointer to the left-child or right-child of `parent`. If `parent` is
/// null, it is a pointer to the root of the [`RBTree`].
struct RawVacantEntry<'a, K, V> {
rbtree: *mut RBTree<K, V>,
/// The node that will become the parent of the new node if we insert one.
parent: *mut bindings::rb_node,
/// This points to the left-child or right-child field of `parent`, or `root` if `parent` is
/// null.
child_field_of_parent: *mut *mut bindings::rb_node,
_phantom: PhantomData<&'a mut RBTree<K, V>>,
}
impl<'a, K, V> RawVacantEntry<'a, K, V> {
/// Inserts the given node into the [`RBTree`] at this entry.
///
/// The `node` must have a key such that inserting it here does not break the ordering of this
/// [`RBTree`].
fn insert(self, node: RBTreeNode<K, V>) -> &'a mut V {
let node = Box::into_raw(node.node);
// SAFETY: `node` is valid at least until we call `Box::from_raw`, which only happens when
// the node is removed or replaced.
let node_links = unsafe { addr_of_mut!((*node).links) };
// INVARIANT: We are linking in a new node, which is valid. It remains valid because we
// "forgot" it with `Box::into_raw`.
// SAFETY: The type invariants of `RawVacantEntry` are exactly the safety requirements of `rb_link_node`.
unsafe { bindings::rb_link_node(node_links, self.parent, self.child_field_of_parent) };
// SAFETY: All pointers are valid. `node` has just been inserted into the tree.
unsafe { bindings::rb_insert_color(node_links, addr_of_mut!((*self.rbtree).root)) };
// SAFETY: The node is valid until we remove it from the tree.
unsafe { &mut (*node).value }
}
}
impl<'a, K, V> VacantEntry<'a, K, V> {
/// Inserts the given node into the [`RBTree`] at this entry.
pub fn insert(self, value: V, reservation: RBTreeNodeReservation<K, V>) -> &'a mut V {
self.raw.insert(reservation.into_node(self.key, value))
}
}
/// A view into an occupied entry in a [`RBTree`]. It is part of the [`Entry`] enum.
///
/// # Invariants
/// - `node_links` is a valid, non-null pointer to a tree node in `self.rbtree`
pub struct OccupiedEntry<'a, K, V> {
rbtree: &'a mut RBTree<K, V>,
/// The node that this entry corresponds to.
node_links: *mut bindings::rb_node,
}
impl<'a, K, V> OccupiedEntry<'a, K, V> {
/// Gets a reference to the value in the entry.
pub fn get(&self) -> &V {
// SAFETY:
// - `self.node_links` is a valid pointer to a node in the tree.
// - We have shared access to the underlying tree, and can thus give out a shared reference.
unsafe { &(*container_of!(self.node_links, Node<K, V>, links)).value }
}
/// Gets a mutable reference to the value in the entry.
pub fn get_mut(&mut self) -> &mut V {
// SAFETY:
// - `self.node_links` is a valid pointer to a node in the tree.
// - We have exclusive access to the underlying tree, and can thus give out a mutable reference.
unsafe { &mut (*(container_of!(self.node_links, Node<K, V>, links).cast_mut())).value }
}
/// Converts the entry into a mutable reference to its value.
///
/// If you need multiple references to the `OccupiedEntry`, see [`self#get_mut`].
pub fn into_mut(self) -> &'a mut V {
// SAFETY:
// - `self.node_links` is a valid pointer to a node in the tree.
// - This consumes the `&'a mut RBTree<K, V>`, therefore it can give out a mutable reference that lives for `'a`.
unsafe { &mut (*(container_of!(self.node_links, Node<K, V>, links).cast_mut())).value }
}
/// Remove this entry from the [`RBTree`].
pub fn remove_node(self) -> RBTreeNode<K, V> {
// SAFETY: The node is a node in the tree, so it is valid.
unsafe { bindings::rb_erase(self.node_links, &mut self.rbtree.root) };
// INVARIANT: The node is being returned and the caller may free it, however, it was
// removed from the tree. So the invariants still hold.
RBTreeNode {
// SAFETY: The node was a node in the tree, but we removed it, so we can convert it
// back into a box.
node: unsafe {
Box::from_raw(container_of!(self.node_links, Node<K, V>, links).cast_mut())
},
}
}
/// Takes the value of the entry out of the map, and returns it.
pub fn remove(self) -> V {
self.remove_node().node.value
}
/// Swap the current node for the provided node.
///
/// The key of both nodes must be equal.
fn replace(self, node: RBTreeNode<K, V>) -> RBTreeNode<K, V> {
let node = Box::into_raw(node.node);
// SAFETY: `node` is valid at least until we call `Box::from_raw`, which only happens when
// the node is removed or replaced.
let new_node_links = unsafe { addr_of_mut!((*node).links) };
// SAFETY: This updates the pointers so that `new_node_links` is in the tree where
// `self.node_links` used to be.
unsafe {
bindings::rb_replace_node(self.node_links, new_node_links, &mut self.rbtree.root)
};
// SAFETY:
// - `self.node_ptr` produces a valid pointer to a node in the tree.
// - Now that we removed this entry from the tree, we can convert the node to a box.
let old_node =
unsafe { Box::from_raw(container_of!(self.node_links, Node<K, V>, links).cast_mut()) };
RBTreeNode { node: old_node }
}
}
struct Node<K, V> { struct Node<K, V> {
links: bindings::rb_node, links: bindings::rb_node,
key: K, key: K,