mirror of
https://github.com/qemu/qemu.git
synced 2024-12-15 15:33:29 +08:00
cedb70eafb
Since we already have bitmap_mutex to protect either the dirty bitmap or the clear log bitmap, we don't need atomic operations to set/clear/test on the clear log bitmap. Switching all ops from atomic to non-atomic versions, meanwhile touch up the comments to show which lock is in charge. Introduced non-atomic version of bitmap_test_and_clear_atomic(), mostly the same as the atomic version but simplified a few places, e.g. dropped the "old_bits" variable, and also the explicit memory barriers. Reviewed-by: Dr. David Alan Gilbert <dgilbert@redhat.com> Signed-off-by: Peter Xu <peterx@redhat.com> Reviewed-by: Juan Quintela <quintela@redhat.com> Signed-off-by: Juan Quintela <quintela@redhat.com>
535 lines
14 KiB
C
535 lines
14 KiB
C
/*
|
|
* Bitmap Module
|
|
*
|
|
* Stolen from linux/src/lib/bitmap.c
|
|
*
|
|
* Copyright (C) 2010 Corentin Chary
|
|
*
|
|
* This source code is licensed under the GNU General Public License,
|
|
* Version 2.
|
|
*/
|
|
|
|
#include "qemu/osdep.h"
|
|
#include "qemu/bitops.h"
|
|
#include "qemu/bitmap.h"
|
|
#include "qemu/atomic.h"
|
|
|
|
/*
|
|
* bitmaps provide an array of bits, implemented using an
|
|
* array of unsigned longs. The number of valid bits in a
|
|
* given bitmap does _not_ need to be an exact multiple of
|
|
* BITS_PER_LONG.
|
|
*
|
|
* The possible unused bits in the last, partially used word
|
|
* of a bitmap are 'don't care'. The implementation makes
|
|
* no particular effort to keep them zero. It ensures that
|
|
* their value will not affect the results of any operation.
|
|
* The bitmap operations that return Boolean (bitmap_empty,
|
|
* for example) or scalar (bitmap_weight, for example) results
|
|
* carefully filter out these unused bits from impacting their
|
|
* results.
|
|
*
|
|
* These operations actually hold to a slightly stronger rule:
|
|
* if you don't input any bitmaps to these ops that have some
|
|
* unused bits set, then they won't output any set unused bits
|
|
* in output bitmaps.
|
|
*
|
|
* The byte ordering of bitmaps is more natural on little
|
|
* endian architectures.
|
|
*/
|
|
|
|
int slow_bitmap_empty(const unsigned long *bitmap, long bits)
|
|
{
|
|
long k, lim = bits/BITS_PER_LONG;
|
|
|
|
for (k = 0; k < lim; ++k) {
|
|
if (bitmap[k]) {
|
|
return 0;
|
|
}
|
|
}
|
|
if (bits % BITS_PER_LONG) {
|
|
if (bitmap[k] & BITMAP_LAST_WORD_MASK(bits)) {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
int slow_bitmap_full(const unsigned long *bitmap, long bits)
|
|
{
|
|
long k, lim = bits/BITS_PER_LONG;
|
|
|
|
for (k = 0; k < lim; ++k) {
|
|
if (~bitmap[k]) {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
if (bits % BITS_PER_LONG) {
|
|
if (~bitmap[k] & BITMAP_LAST_WORD_MASK(bits)) {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
int slow_bitmap_equal(const unsigned long *bitmap1,
|
|
const unsigned long *bitmap2, long bits)
|
|
{
|
|
long k, lim = bits/BITS_PER_LONG;
|
|
|
|
for (k = 0; k < lim; ++k) {
|
|
if (bitmap1[k] != bitmap2[k]) {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
if (bits % BITS_PER_LONG) {
|
|
if ((bitmap1[k] ^ bitmap2[k]) & BITMAP_LAST_WORD_MASK(bits)) {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
void slow_bitmap_complement(unsigned long *dst, const unsigned long *src,
|
|
long bits)
|
|
{
|
|
long k, lim = bits/BITS_PER_LONG;
|
|
|
|
for (k = 0; k < lim; ++k) {
|
|
dst[k] = ~src[k];
|
|
}
|
|
|
|
if (bits % BITS_PER_LONG) {
|
|
dst[k] = ~src[k] & BITMAP_LAST_WORD_MASK(bits);
|
|
}
|
|
}
|
|
|
|
int slow_bitmap_and(unsigned long *dst, const unsigned long *bitmap1,
|
|
const unsigned long *bitmap2, long bits)
|
|
{
|
|
long k;
|
|
long nr = BITS_TO_LONGS(bits);
|
|
unsigned long result = 0;
|
|
|
|
for (k = 0; k < nr; k++) {
|
|
result |= (dst[k] = bitmap1[k] & bitmap2[k]);
|
|
}
|
|
return result != 0;
|
|
}
|
|
|
|
void slow_bitmap_or(unsigned long *dst, const unsigned long *bitmap1,
|
|
const unsigned long *bitmap2, long bits)
|
|
{
|
|
long k;
|
|
long nr = BITS_TO_LONGS(bits);
|
|
|
|
for (k = 0; k < nr; k++) {
|
|
dst[k] = bitmap1[k] | bitmap2[k];
|
|
}
|
|
}
|
|
|
|
void slow_bitmap_xor(unsigned long *dst, const unsigned long *bitmap1,
|
|
const unsigned long *bitmap2, long bits)
|
|
{
|
|
long k;
|
|
long nr = BITS_TO_LONGS(bits);
|
|
|
|
for (k = 0; k < nr; k++) {
|
|
dst[k] = bitmap1[k] ^ bitmap2[k];
|
|
}
|
|
}
|
|
|
|
int slow_bitmap_andnot(unsigned long *dst, const unsigned long *bitmap1,
|
|
const unsigned long *bitmap2, long bits)
|
|
{
|
|
long k;
|
|
long nr = BITS_TO_LONGS(bits);
|
|
unsigned long result = 0;
|
|
|
|
for (k = 0; k < nr; k++) {
|
|
result |= (dst[k] = bitmap1[k] & ~bitmap2[k]);
|
|
}
|
|
return result != 0;
|
|
}
|
|
|
|
void bitmap_set(unsigned long *map, long start, long nr)
|
|
{
|
|
unsigned long *p = map + BIT_WORD(start);
|
|
const long size = start + nr;
|
|
int bits_to_set = BITS_PER_LONG - (start % BITS_PER_LONG);
|
|
unsigned long mask_to_set = BITMAP_FIRST_WORD_MASK(start);
|
|
|
|
assert(start >= 0 && nr >= 0);
|
|
|
|
while (nr - bits_to_set >= 0) {
|
|
*p |= mask_to_set;
|
|
nr -= bits_to_set;
|
|
bits_to_set = BITS_PER_LONG;
|
|
mask_to_set = ~0UL;
|
|
p++;
|
|
}
|
|
if (nr) {
|
|
mask_to_set &= BITMAP_LAST_WORD_MASK(size);
|
|
*p |= mask_to_set;
|
|
}
|
|
}
|
|
|
|
void bitmap_set_atomic(unsigned long *map, long start, long nr)
|
|
{
|
|
unsigned long *p = map + BIT_WORD(start);
|
|
const long size = start + nr;
|
|
int bits_to_set = BITS_PER_LONG - (start % BITS_PER_LONG);
|
|
unsigned long mask_to_set = BITMAP_FIRST_WORD_MASK(start);
|
|
|
|
assert(start >= 0 && nr >= 0);
|
|
|
|
/* First word */
|
|
if (nr - bits_to_set > 0) {
|
|
qatomic_or(p, mask_to_set);
|
|
nr -= bits_to_set;
|
|
bits_to_set = BITS_PER_LONG;
|
|
mask_to_set = ~0UL;
|
|
p++;
|
|
}
|
|
|
|
/* Full words */
|
|
if (bits_to_set == BITS_PER_LONG) {
|
|
while (nr >= BITS_PER_LONG) {
|
|
*p = ~0UL;
|
|
nr -= BITS_PER_LONG;
|
|
p++;
|
|
}
|
|
}
|
|
|
|
/* Last word */
|
|
if (nr) {
|
|
mask_to_set &= BITMAP_LAST_WORD_MASK(size);
|
|
qatomic_or(p, mask_to_set);
|
|
} else {
|
|
/* If we avoided the full barrier in qatomic_or(), issue a
|
|
* barrier to account for the assignments in the while loop.
|
|
*/
|
|
smp_mb();
|
|
}
|
|
}
|
|
|
|
void bitmap_clear(unsigned long *map, long start, long nr)
|
|
{
|
|
unsigned long *p = map + BIT_WORD(start);
|
|
const long size = start + nr;
|
|
int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
|
|
unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
|
|
|
|
assert(start >= 0 && nr >= 0);
|
|
|
|
while (nr - bits_to_clear >= 0) {
|
|
*p &= ~mask_to_clear;
|
|
nr -= bits_to_clear;
|
|
bits_to_clear = BITS_PER_LONG;
|
|
mask_to_clear = ~0UL;
|
|
p++;
|
|
}
|
|
if (nr) {
|
|
mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
|
|
*p &= ~mask_to_clear;
|
|
}
|
|
}
|
|
|
|
bool bitmap_test_and_clear(unsigned long *map, long start, long nr)
|
|
{
|
|
unsigned long *p = map + BIT_WORD(start);
|
|
const long size = start + nr;
|
|
int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
|
|
unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
|
|
bool dirty = false;
|
|
|
|
assert(start >= 0 && nr >= 0);
|
|
|
|
/* First word */
|
|
if (nr - bits_to_clear > 0) {
|
|
if ((*p) & mask_to_clear) {
|
|
dirty = true;
|
|
}
|
|
*p &= ~mask_to_clear;
|
|
nr -= bits_to_clear;
|
|
bits_to_clear = BITS_PER_LONG;
|
|
p++;
|
|
}
|
|
|
|
/* Full words */
|
|
if (bits_to_clear == BITS_PER_LONG) {
|
|
while (nr >= BITS_PER_LONG) {
|
|
if (*p) {
|
|
dirty = true;
|
|
*p = 0;
|
|
}
|
|
nr -= BITS_PER_LONG;
|
|
p++;
|
|
}
|
|
}
|
|
|
|
/* Last word */
|
|
if (nr) {
|
|
mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
|
|
if ((*p) & mask_to_clear) {
|
|
dirty = true;
|
|
}
|
|
*p &= ~mask_to_clear;
|
|
}
|
|
|
|
return dirty;
|
|
}
|
|
|
|
bool bitmap_test_and_clear_atomic(unsigned long *map, long start, long nr)
|
|
{
|
|
unsigned long *p = map + BIT_WORD(start);
|
|
const long size = start + nr;
|
|
int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
|
|
unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
|
|
unsigned long dirty = 0;
|
|
unsigned long old_bits;
|
|
|
|
assert(start >= 0 && nr >= 0);
|
|
|
|
/* First word */
|
|
if (nr - bits_to_clear > 0) {
|
|
old_bits = qatomic_fetch_and(p, ~mask_to_clear);
|
|
dirty |= old_bits & mask_to_clear;
|
|
nr -= bits_to_clear;
|
|
bits_to_clear = BITS_PER_LONG;
|
|
mask_to_clear = ~0UL;
|
|
p++;
|
|
}
|
|
|
|
/* Full words */
|
|
if (bits_to_clear == BITS_PER_LONG) {
|
|
while (nr >= BITS_PER_LONG) {
|
|
if (*p) {
|
|
old_bits = qatomic_xchg(p, 0);
|
|
dirty |= old_bits;
|
|
}
|
|
nr -= BITS_PER_LONG;
|
|
p++;
|
|
}
|
|
}
|
|
|
|
/* Last word */
|
|
if (nr) {
|
|
mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
|
|
old_bits = qatomic_fetch_and(p, ~mask_to_clear);
|
|
dirty |= old_bits & mask_to_clear;
|
|
} else {
|
|
if (!dirty) {
|
|
smp_mb();
|
|
}
|
|
}
|
|
|
|
return dirty != 0;
|
|
}
|
|
|
|
void bitmap_copy_and_clear_atomic(unsigned long *dst, unsigned long *src,
|
|
long nr)
|
|
{
|
|
while (nr > 0) {
|
|
*dst = qatomic_xchg(src, 0);
|
|
dst++;
|
|
src++;
|
|
nr -= BITS_PER_LONG;
|
|
}
|
|
}
|
|
|
|
#define ALIGN_MASK(x,mask) (((x)+(mask))&~(mask))
|
|
|
|
/**
|
|
* bitmap_find_next_zero_area - find a contiguous aligned zero area
|
|
* @map: The address to base the search on
|
|
* @size: The bitmap size in bits
|
|
* @start: The bitnumber to start searching at
|
|
* @nr: The number of zeroed bits we're looking for
|
|
* @align_mask: Alignment mask for zero area
|
|
*
|
|
* The @align_mask should be one less than a power of 2; the effect is that
|
|
* the bit offset of all zero areas this function finds is multiples of that
|
|
* power of 2. A @align_mask of 0 means no alignment is required.
|
|
*/
|
|
unsigned long bitmap_find_next_zero_area(unsigned long *map,
|
|
unsigned long size,
|
|
unsigned long start,
|
|
unsigned long nr,
|
|
unsigned long align_mask)
|
|
{
|
|
unsigned long index, end, i;
|
|
again:
|
|
index = find_next_zero_bit(map, size, start);
|
|
|
|
/* Align allocation */
|
|
index = ALIGN_MASK(index, align_mask);
|
|
|
|
end = index + nr;
|
|
if (end > size) {
|
|
return end;
|
|
}
|
|
i = find_next_bit(map, end, index);
|
|
if (i < end) {
|
|
start = i + 1;
|
|
goto again;
|
|
}
|
|
return index;
|
|
}
|
|
|
|
int slow_bitmap_intersects(const unsigned long *bitmap1,
|
|
const unsigned long *bitmap2, long bits)
|
|
{
|
|
long k, lim = bits/BITS_PER_LONG;
|
|
|
|
for (k = 0; k < lim; ++k) {
|
|
if (bitmap1[k] & bitmap2[k]) {
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
if (bits % BITS_PER_LONG) {
|
|
if ((bitmap1[k] & bitmap2[k]) & BITMAP_LAST_WORD_MASK(bits)) {
|
|
return 1;
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
long slow_bitmap_count_one(const unsigned long *bitmap, long nbits)
|
|
{
|
|
long k, lim = nbits / BITS_PER_LONG, result = 0;
|
|
|
|
for (k = 0; k < lim; k++) {
|
|
result += ctpopl(bitmap[k]);
|
|
}
|
|
|
|
if (nbits % BITS_PER_LONG) {
|
|
result += ctpopl(bitmap[k] & BITMAP_LAST_WORD_MASK(nbits));
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
static void bitmap_to_from_le(unsigned long *dst,
|
|
const unsigned long *src, long nbits)
|
|
{
|
|
long len = BITS_TO_LONGS(nbits);
|
|
|
|
#if HOST_BIG_ENDIAN
|
|
long index;
|
|
|
|
for (index = 0; index < len; index++) {
|
|
# if HOST_LONG_BITS == 64
|
|
dst[index] = bswap64(src[index]);
|
|
# else
|
|
dst[index] = bswap32(src[index]);
|
|
# endif
|
|
}
|
|
#else
|
|
memcpy(dst, src, len * sizeof(unsigned long));
|
|
#endif
|
|
}
|
|
|
|
void bitmap_from_le(unsigned long *dst, const unsigned long *src,
|
|
long nbits)
|
|
{
|
|
bitmap_to_from_le(dst, src, nbits);
|
|
}
|
|
|
|
void bitmap_to_le(unsigned long *dst, const unsigned long *src,
|
|
long nbits)
|
|
{
|
|
bitmap_to_from_le(dst, src, nbits);
|
|
}
|
|
|
|
/*
|
|
* Copy "src" bitmap with a positive offset and put it into the "dst"
|
|
* bitmap. The caller needs to make sure the bitmap size of "src"
|
|
* is bigger than (shift + nbits).
|
|
*/
|
|
void bitmap_copy_with_src_offset(unsigned long *dst, const unsigned long *src,
|
|
unsigned long shift, unsigned long nbits)
|
|
{
|
|
unsigned long left_mask, right_mask, last_mask;
|
|
|
|
/* Proper shift src pointer to the first word to copy from */
|
|
src += BIT_WORD(shift);
|
|
shift %= BITS_PER_LONG;
|
|
|
|
if (!shift) {
|
|
/* Fast path */
|
|
bitmap_copy(dst, src, nbits);
|
|
return;
|
|
}
|
|
|
|
right_mask = (1ul << shift) - 1;
|
|
left_mask = ~right_mask;
|
|
|
|
while (nbits >= BITS_PER_LONG) {
|
|
*dst = (*src & left_mask) >> shift;
|
|
*dst |= (src[1] & right_mask) << (BITS_PER_LONG - shift);
|
|
dst++;
|
|
src++;
|
|
nbits -= BITS_PER_LONG;
|
|
}
|
|
|
|
if (nbits > BITS_PER_LONG - shift) {
|
|
*dst = (*src & left_mask) >> shift;
|
|
nbits -= BITS_PER_LONG - shift;
|
|
last_mask = (1ul << nbits) - 1;
|
|
*dst |= (src[1] & last_mask) << (BITS_PER_LONG - shift);
|
|
} else if (nbits) {
|
|
last_mask = (1ul << nbits) - 1;
|
|
*dst = (*src >> shift) & last_mask;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Copy "src" bitmap into the "dst" bitmap with an offset in the
|
|
* "dst". The caller needs to make sure the bitmap size of "dst" is
|
|
* bigger than (shift + nbits).
|
|
*/
|
|
void bitmap_copy_with_dst_offset(unsigned long *dst, const unsigned long *src,
|
|
unsigned long shift, unsigned long nbits)
|
|
{
|
|
unsigned long left_mask, right_mask, last_mask;
|
|
|
|
/* Proper shift dst pointer to the first word to copy from */
|
|
dst += BIT_WORD(shift);
|
|
shift %= BITS_PER_LONG;
|
|
|
|
if (!shift) {
|
|
/* Fast path */
|
|
bitmap_copy(dst, src, nbits);
|
|
return;
|
|
}
|
|
|
|
right_mask = (1ul << (BITS_PER_LONG - shift)) - 1;
|
|
left_mask = ~right_mask;
|
|
|
|
*dst &= (1ul << shift) - 1;
|
|
while (nbits >= BITS_PER_LONG) {
|
|
*dst |= (*src & right_mask) << shift;
|
|
dst[1] = (*src & left_mask) >> (BITS_PER_LONG - shift);
|
|
dst++;
|
|
src++;
|
|
nbits -= BITS_PER_LONG;
|
|
}
|
|
|
|
if (nbits > BITS_PER_LONG - shift) {
|
|
*dst |= (*src & right_mask) << shift;
|
|
nbits -= BITS_PER_LONG - shift;
|
|
last_mask = ((1ul << nbits) - 1) << (BITS_PER_LONG - shift);
|
|
dst[1] = (*src & last_mask) >> (BITS_PER_LONG - shift);
|
|
} else if (nbits) {
|
|
last_mask = (1ul << nbits) - 1;
|
|
*dst |= (*src & last_mask) << shift;
|
|
}
|
|
}
|