2017-03-17 14:18:50 +08:00
|
|
|
/* SPDX-License-Identifier: GPL-2.0 */
|
|
|
|
#ifndef _EYTZINGER_H
|
|
|
|
#define _EYTZINGER_H
|
|
|
|
|
|
|
|
#include <linux/bitops.h>
|
|
|
|
#include <linux/log2.h>
|
|
|
|
|
2024-03-23 07:26:33 +08:00
|
|
|
#ifdef EYTZINGER_DEBUG
|
|
|
|
#define EYTZINGER_BUG_ON(cond) BUG_ON(cond)
|
|
|
|
#else
|
|
|
|
#define EYTZINGER_BUG_ON(cond)
|
|
|
|
#endif
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Traversal for trees in eytzinger layout - a full binary tree layed out in an
|
2024-03-23 07:26:33 +08:00
|
|
|
* array.
|
2017-03-17 14:18:50 +08:00
|
|
|
*
|
2024-03-23 07:26:33 +08:00
|
|
|
* Consider using an eytzinger tree any time you would otherwise be doing binary
|
|
|
|
* search over an array. Binary search is a worst case scenario for branch
|
|
|
|
* prediction and prefetching, but in an eytzinger tree every node's children
|
|
|
|
* are adjacent in memory, thus we can prefetch children before knowing the
|
|
|
|
* result of the comparison, assuming multiple nodes fit on a cacheline.
|
|
|
|
*
|
|
|
|
* Two variants are provided, for one based indexing and zero based indexing.
|
|
|
|
*
|
|
|
|
* Zero based indexing is more convenient, but one based indexing has better
|
|
|
|
* alignment and thus better performance because each new level of the tree
|
|
|
|
* starts at a power of two, and thus if element 0 was cacheline aligned, each
|
|
|
|
* new level will be as well.
|
2017-03-17 14:18:50 +08:00
|
|
|
*/
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_child(unsigned i, unsigned child)
|
|
|
|
{
|
2024-03-23 07:26:33 +08:00
|
|
|
EYTZINGER_BUG_ON(child > 1);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
return (i << 1) + child;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_left_child(unsigned i)
|
|
|
|
{
|
|
|
|
return eytzinger1_child(i, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_right_child(unsigned i)
|
|
|
|
{
|
|
|
|
return eytzinger1_child(i, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_first(unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return rounddown_pow_of_two(size);
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_last(unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return rounddown_pow_of_two(size + 1) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* eytzinger1_next() and eytzinger1_prev() have the nice properties that
|
|
|
|
*
|
|
|
|
* eytzinger1_next(0) == eytzinger1_first())
|
|
|
|
* eytzinger1_prev(0) == eytzinger1_last())
|
|
|
|
*
|
|
|
|
* eytzinger1_prev(eytzinger1_first()) == 0
|
|
|
|
* eytzinger1_next(eytzinger1_last()) == 0
|
|
|
|
*/
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_next(unsigned i, unsigned size)
|
|
|
|
{
|
2024-03-23 07:26:33 +08:00
|
|
|
EYTZINGER_BUG_ON(i > size);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
2022-01-03 13:22:29 +08:00
|
|
|
if (eytzinger1_right_child(i) <= size) {
|
2017-03-17 14:18:50 +08:00
|
|
|
i = eytzinger1_right_child(i);
|
|
|
|
|
2022-01-03 13:22:29 +08:00
|
|
|
i <<= __fls(size + 1) - __fls(i);
|
|
|
|
i >>= i > size;
|
2017-03-17 14:18:50 +08:00
|
|
|
} else {
|
|
|
|
i >>= ffz(i) + 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_prev(unsigned i, unsigned size)
|
|
|
|
{
|
2024-03-23 07:26:33 +08:00
|
|
|
EYTZINGER_BUG_ON(i > size);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
2022-01-03 13:22:29 +08:00
|
|
|
if (eytzinger1_left_child(i) <= size) {
|
2017-03-17 14:18:50 +08:00
|
|
|
i = eytzinger1_left_child(i) + 1;
|
|
|
|
|
2022-01-03 13:22:29 +08:00
|
|
|
i <<= __fls(size + 1) - __fls(i);
|
2017-03-17 14:18:50 +08:00
|
|
|
i -= 1;
|
2022-01-03 13:22:29 +08:00
|
|
|
i >>= i > size;
|
2017-03-17 14:18:50 +08:00
|
|
|
} else {
|
|
|
|
i >>= __ffs(i) + 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_extra(unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return (size + 1 - rounddown_pow_of_two(size)) << 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned __eytzinger1_to_inorder(unsigned i, unsigned size,
|
|
|
|
unsigned extra)
|
|
|
|
{
|
|
|
|
unsigned b = __fls(i);
|
2022-01-03 13:22:29 +08:00
|
|
|
unsigned shift = __fls(size) - b;
|
2017-03-17 14:18:50 +08:00
|
|
|
int s;
|
|
|
|
|
2024-03-23 07:26:33 +08:00
|
|
|
EYTZINGER_BUG_ON(!i || i > size);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
i ^= 1U << b;
|
|
|
|
i <<= 1;
|
|
|
|
i |= 1;
|
|
|
|
i <<= shift;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* sign bit trick:
|
|
|
|
*
|
|
|
|
* if (i > extra)
|
|
|
|
* i -= (i - extra) >> 1;
|
|
|
|
*/
|
|
|
|
s = extra - i;
|
|
|
|
i += (s >> 1) & (s >> 31);
|
|
|
|
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned __inorder_to_eytzinger1(unsigned i, unsigned size,
|
|
|
|
unsigned extra)
|
|
|
|
{
|
|
|
|
unsigned shift;
|
|
|
|
int s;
|
|
|
|
|
2024-03-23 07:26:33 +08:00
|
|
|
EYTZINGER_BUG_ON(!i || i > size);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* sign bit trick:
|
|
|
|
*
|
|
|
|
* if (i > extra)
|
|
|
|
* i += i - extra;
|
|
|
|
*/
|
|
|
|
s = extra - i;
|
|
|
|
i -= s & (s >> 31);
|
|
|
|
|
|
|
|
shift = __ffs(i);
|
|
|
|
|
|
|
|
i >>= shift + 1;
|
2022-01-03 13:22:29 +08:00
|
|
|
i |= 1U << (__fls(size) - shift);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger1_to_inorder(unsigned i, unsigned size)
|
|
|
|
{
|
|
|
|
return __eytzinger1_to_inorder(i, size, eytzinger1_extra(size));
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned inorder_to_eytzinger1(unsigned i, unsigned size)
|
|
|
|
{
|
|
|
|
return __inorder_to_eytzinger1(i, size, eytzinger1_extra(size));
|
|
|
|
}
|
|
|
|
|
|
|
|
#define eytzinger1_for_each(_i, _size) \
|
2024-01-07 08:29:14 +08:00
|
|
|
for (unsigned (_i) = eytzinger1_first((_size)); \
|
2017-03-17 14:18:50 +08:00
|
|
|
(_i) != 0; \
|
|
|
|
(_i) = eytzinger1_next((_i), (_size)))
|
|
|
|
|
|
|
|
/* Zero based indexing version: */
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_child(unsigned i, unsigned child)
|
|
|
|
{
|
2024-03-23 07:26:33 +08:00
|
|
|
EYTZINGER_BUG_ON(child > 1);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
return (i << 1) + 1 + child;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_left_child(unsigned i)
|
|
|
|
{
|
|
|
|
return eytzinger0_child(i, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_right_child(unsigned i)
|
|
|
|
{
|
|
|
|
return eytzinger0_child(i, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_first(unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return eytzinger1_first(size) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_last(unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return eytzinger1_last(size) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_next(unsigned i, unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return eytzinger1_next(i + 1, size) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_prev(unsigned i, unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return eytzinger1_prev(i + 1, size) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_extra(unsigned size)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return eytzinger1_extra(size);
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned __eytzinger0_to_inorder(unsigned i, unsigned size,
|
|
|
|
unsigned extra)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return __eytzinger1_to_inorder(i + 1, size, extra) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned __inorder_to_eytzinger0(unsigned i, unsigned size,
|
|
|
|
unsigned extra)
|
|
|
|
{
|
2022-01-03 13:22:29 +08:00
|
|
|
return __inorder_to_eytzinger1(i + 1, size, extra) - 1;
|
2017-03-17 14:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned eytzinger0_to_inorder(unsigned i, unsigned size)
|
|
|
|
{
|
|
|
|
return __eytzinger0_to_inorder(i, size, eytzinger0_extra(size));
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned inorder_to_eytzinger0(unsigned i, unsigned size)
|
|
|
|
{
|
|
|
|
return __inorder_to_eytzinger0(i, size, eytzinger0_extra(size));
|
|
|
|
}
|
|
|
|
|
|
|
|
#define eytzinger0_for_each(_i, _size) \
|
2024-01-07 08:29:14 +08:00
|
|
|
for (unsigned (_i) = eytzinger0_first((_size)); \
|
2017-03-17 14:18:50 +08:00
|
|
|
(_i) != -1; \
|
|
|
|
(_i) = eytzinger0_next((_i), (_size)))
|
|
|
|
|
|
|
|
/* return greatest node <= @search, or -1 if not found */
|
2024-04-09 10:32:08 +08:00
|
|
|
static inline int eytzinger0_find_le(void *base, size_t nr, size_t size,
|
|
|
|
cmp_func_t cmp, const void *search)
|
2017-03-17 14:18:50 +08:00
|
|
|
{
|
|
|
|
unsigned i, n = 0;
|
|
|
|
|
|
|
|
if (!nr)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
do {
|
|
|
|
i = n;
|
2024-03-23 07:26:33 +08:00
|
|
|
n = eytzinger0_child(i, cmp(base + i * size, search) <= 0);
|
2017-03-17 14:18:50 +08:00
|
|
|
} while (n < nr);
|
|
|
|
|
|
|
|
if (n & 1) {
|
2024-04-09 10:32:08 +08:00
|
|
|
/*
|
|
|
|
* @i was greater than @search, return previous node:
|
|
|
|
*
|
|
|
|
* if @i was leftmost/smallest element,
|
|
|
|
* eytzinger0_prev(eytzinger0_first())) returns -1, as expected
|
|
|
|
*/
|
2017-03-17 14:18:50 +08:00
|
|
|
return eytzinger0_prev(i, nr);
|
|
|
|
} else {
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-04-09 10:32:08 +08:00
|
|
|
static inline int eytzinger0_find_gt(void *base, size_t nr, size_t size,
|
|
|
|
cmp_func_t cmp, const void *search)
|
2024-03-23 07:26:33 +08:00
|
|
|
{
|
|
|
|
ssize_t idx = eytzinger0_find_le(base, nr, size, cmp, search);
|
2024-04-09 10:32:08 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* if eytitzinger0_find_le() returned -1 - no element was <= search - we
|
|
|
|
* want to return the first element; next/prev identities mean this work
|
|
|
|
* as expected
|
|
|
|
*
|
|
|
|
* similarly if find_le() returns last element, we should return -1;
|
|
|
|
* identities mean this all works out:
|
|
|
|
*/
|
|
|
|
return eytzinger0_next(idx, nr);
|
2024-03-23 07:26:33 +08:00
|
|
|
}
|
|
|
|
|
2019-01-22 04:32:13 +08:00
|
|
|
#define eytzinger0_find(base, nr, size, _cmp, search) \
|
|
|
|
({ \
|
2024-01-06 09:02:33 +08:00
|
|
|
void *_base = (base); \
|
|
|
|
const void *_search = (search); \
|
|
|
|
size_t _nr = (nr); \
|
|
|
|
size_t _size = (size); \
|
|
|
|
size_t _i = 0; \
|
2019-01-22 04:32:13 +08:00
|
|
|
int _res; \
|
|
|
|
\
|
|
|
|
while (_i < _nr && \
|
2024-03-23 07:26:33 +08:00
|
|
|
(_res = _cmp(_search, _base + _i * _size))) \
|
2019-01-22 04:32:13 +08:00
|
|
|
_i = eytzinger0_child(_i, _res > 0); \
|
|
|
|
_i; \
|
|
|
|
})
|
2017-03-17 14:18:50 +08:00
|
|
|
|
2024-03-23 07:26:33 +08:00
|
|
|
void eytzinger0_sort_r(void *, size_t, size_t,
|
|
|
|
cmp_r_func_t, swap_r_func_t, const void *);
|
|
|
|
void eytzinger0_sort(void *, size_t, size_t, cmp_func_t, swap_func_t);
|
2017-03-17 14:18:50 +08:00
|
|
|
|
|
|
|
#endif /* _EYTZINGER_H */
|