diff options
| author | Chi-Kuan Chiu <105687635+devarajabc@users.noreply.github.com> | 2024-11-26 00:08:05 +0800 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2024-11-25 17:08:05 +0100 |
| commit | dcf196c2ae1ddddc8c6eb7a6ad5066c39dc954de (patch) | |
| tree | 739a9b7f01190a21a67980ddec8b218adeae5190 /src/include | |
| parent | a71856801b2a9f36a8745d0285778e6654a3408d (diff) | |
| download | box64-dcf196c2ae1ddddc8c6eb7a6ad5066c39dc954de.tar.gz box64-dcf196c2ae1ddddc8c6eb7a6ad5066c39dc954de.zip | |
[RBTREE] Document the rationale for memory management (#2060)
Enhanced the rbtree.h header with detailed documentation comments for each function. This comment aims to clarify the role of the red-black tree in memory management and how these functions interact with and manage memory.
Diffstat (limited to 'src/include')
| -rw-r--r-- | src/include/rbtree.h | 199 |
1 files changed, 199 insertions, 0 deletions
diff --git a/src/include/rbtree.h b/src/include/rbtree.h index e2b684cb..00a7a87a 100644 --- a/src/include/rbtree.h +++ b/src/include/rbtree.h @@ -1,3 +1,27 @@ +/* + * The primary function of red-black trees in Box64 is to provide a fast and efficient method (O(log(n))) for managing memory mappings. + * Each red-black tree node includes two additional pointers, "start" and "end," to denote a specific memory range. + * When a range of memory is mapped from the system, it is recorded in red-black trees based on the type and characteristics of that memory range. + * + * Box64 utilizes four red-black trees, each serving distinct purposes: + * 1. memprot: Manages memory protection settings where each node's data field represents the permissions of the memory range. + * The "rb_set" function within this tree can set or change permissions for a specified range. + * 2. mapallmem: Tracks all memory mappings. Its nodes' data field can indicate whether the memory is included in this mapping. + * 3. mmapmem: Similar to "mapallmem" but specifically for memory mapped through the mmap system call. + * The nodes' data fields here differentiate whether the memory is exclusively mapped by mmap. + * 4. blockstree: Specifically contains memory ranges for blocks, where each node represents a different block. + * The "data" field in this tree represents the index of the block in the "blocklist_s" array "p_blocks". + * + * Currently, there is an overlap between "mapallmem" and "mmapmem", where if memory is mapped in "mmapmem", it is also considered mapped in "mapallmem". + * If "mapallmem" and "mmapmem" were to be merged in the future, the "data" field could then take values indicating: + * - 0: Memory is not mapped. + * - 1: Memory is only mapped in "mapallmem". + * - 2: Memory is mapped in both "mapallmem" and "mmapmem". + * + * Before the introduction of the red-black tree in Box64, the rationale for memory management was a sparse array, which takes O(n) complexity for accessing data. + * After transitioning from a sparse array to a red-black tree, the memory usage has decreased slightly for processes that consumed a lot of RAM (for example, Steam uses about 100 MB less memory, and each Wine process uses about 15 MB less). + */ + #ifndef RBTREE_H #define RBTREE_H @@ -5,13 +29,188 @@ typedef struct rbtree rbtree_t; +/** + * rbtree_init() - Initializes a new red-black tree. + * @name: The name of the red-black tree. If null, the default name "(rbtree)" is assigned. + * + * This function allocates memory for a new red-black tree and initializes its properties. + * Return: A pointer to the newly created red-black tree. + */ rbtree_t* rbtree_init(const char* name); + +/** + * rbtree_delete() - Deletes an entire red-black tree. + * @tree: Pointer to the red-black tree to delete. + * + * This function recursively deletes all nodes in the red-black tree starting from the root + * and then frees the memory of the tree structure itself via delete_rbnode(). + */ void rbtree_delete(rbtree_t* tree); +/** + * rb_get() - Retrieves data associated with a specific address in the red-black tree. + * @tree: Pointer to the red-black tree from which data is to be retrieved. + * @addr: The memory address used as a key to find the corresponding node in the tree. + * + * This function searches the red-black tree for a node that corresponds to the specified address. + * Return: The data associated with the address if found; otherwise, 0. + */ uint32_t rb_get(rbtree_t* tree, uintptr_t addr); + +/** + * rb_get_end() - Searches for a node within a specified address range in a red-black tree and retrieves its data and end address. + * @tree: Pointer to the red-black tree to be searched. + * @addr: The address to search for within the nodes of the red-black tree. + * @val: Pointer to store the data of the node that contains the address if found. + * @end: Pointer to store the end address of the node that contains the address, or the start of the next node if not found, or UINTPTR_MAX if no next node exists. + * + * This function traverses the red-black tree starting from the root, searching for a node where the 'addr' falls between the node's start and end addresses (exclusive of end). + * If such a node is found, the function stores the node's data in '*val' and the node's end address in '*end', then returns 1 to indicate success. + * If no such node is found, the function sets '*val' to 0 and '*end' to the start address of the next node in the tree structure or to UINTPTR_MAX if there is no subsequent node. + * Return: 1 if a node containing the address is found, otherwise 0. + */ int rb_get_end(rbtree_t* tree, uintptr_t addr, uint32_t* val, uintptr_t* end); + +/** + * rb_set() - Set an address range in a red-black tree. + * @tree: Pointer to the red-black tree where the address range will be set. + * @start: The starting address of the range to be set. + * @end: The ending address of the range to be set. + * @data: The data value to associate with the address range. + * + * This function adds a new address range with associated data to the red-black tree. + * However, it is not always necessary to create a new node for each new address. + * If the range is adjacent to the existing nodes with the same data, the existing nodes will be extended to contain the new address. + * +---------+---------+---------+ +---------+---------+ + * | data A | | data A | + * +---------+---------+---------+ +---------+---------+ + * + * || + * \||/ + * \/ + * + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * + * If the range overlaps with existing nodes, it will merge or modify nodes to maintain non-overlapping, contiguous ranges. + * This includes extending, splitting, or merging nodes based on the overlap conditions and data consistency. + * It handles multiple edge cases: + * 1. Overlap with same data: The existing node will be extended. + * + * (Case 1: Partial Overlap) + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * ^..... overlap .....^ + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * + * || + * \||/ Extend A + * \/ + * + * +---------+---------+---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+---------+---------+ + * + * (Case 2: Overlap on Both Ends) + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * ^..... overlap .....^ + * +---------+---------+---------+ + * | data A | + * +---------+---------+---------+ + * + * || + * \||/ Do nothing + * \/ + * + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * + * + * 2. Overlap with different data: The overlapped part will be overwritten with the data from the new address range. + * The following graph shows that memory B is going to be added to the red-black tree where memory B overlaps with the existing node memory A. + * + * (Case 1: Overlap on Both Ends) + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * ^..... overlap .....^ + * +---------+---------+---------+ + * | data B | + * +---------+---------+---------+ + * + * || + * \||/ Split the existing node into three new nodes + * \/ + * + * +---------+ +---------+---------+---------+ +---------+ + * | data A | | data B | | data A | + * +---------+ +---------+---------+---------+ +---------+ + * + * (Case 2: Partial Overlap) + * +---------+---------+---------+---------+---------+ + * | data A | + * +---------+---------+---------+---------+---------+ + * ^..... overlap .....^ + * +---------+---------+---------+---------+---------+ + * | data B | + * +---------+---------+---------+---------+---------+ + * + * || + * \||/ Adjust A by changing the pointers to exclude the segments that overlap with B + * \/ + * + * +---------+---------+ +---------+---------+---------+---------+---------+ + * | data A | | data B | + * +---------+---------+ +---------+---------+---------+---------+---------+ + * + * (Case 3: Complete Encapsulation) + * +---------+---------+---------+ + * | data A | + * +---------+---------+---------+ + * + * || + * \||/ Remove A entirely + * \/ + * +---------+---------+---------+---------+---------+ + * | data B | + * +---------+---------+---------+---------+---------+ + * + * The function ensures the tree remains balanced and correctly represents the address space with minimal nodes. + * + * Return: 0 on success, or -1 on failure. + */ int rb_set(rbtree_t* tree, uintptr_t start, uintptr_t end, uint32_t data); + +/** + * rb_unset() - Removes a range of values from the red-black tree. + * @tree: Pointer to the red-black tree. + * @start: The start address of the range to remove. + * @end: The end address of the range to remove. + * + * This function removes or adjusts nodes in the red-black tree that overlap with the specified + * range [start, end). It traverses the tree to find overlapping nodes, removes entire nodes + * that are completely within the range, and modifies nodes that partially overlap by adjusting + * their start or end values accordingly. + * + * Return: 0 on success. + */ int rb_unset(rbtree_t* tree, uintptr_t start, uintptr_t end); + +/** + * rb_get_righter() - Retrieves the start value of the right-most node in a red-black tree. + * @tree: Pointer to the red-black tree whose right-most node's start value is to be retrieved. + * + * This function traverses the red-black tree from the root to the right-most node, which is the node + * with the highest key value in the tree. + * Return: The start value of the right-most node if the tree is not empty; otherwise, 0. + */ uintptr_t rb_get_righter(rbtree_t* tree); #endif // RBTREE_H |