mirror of
				https://github.com/qemu/qemu.git
				synced 2025-10-25 03:03:32 +00:00 
			
		
		
		
	 cedb70eafb
			
		
	
	
		cedb70eafb
		
	
	
	
	
		
			
			Since we already have bitmap_mutex to protect either the dirty bitmap or the clear log bitmap, we don't need atomic operations to set/clear/test on the clear log bitmap. Switching all ops from atomic to non-atomic versions, meanwhile touch up the comments to show which lock is in charge. Introduced non-atomic version of bitmap_test_and_clear_atomic(), mostly the same as the atomic version but simplified a few places, e.g. dropped the "old_bits" variable, and also the explicit memory barriers. Reviewed-by: Dr. David Alan Gilbert <dgilbert@redhat.com> Signed-off-by: Peter Xu <peterx@redhat.com> Reviewed-by: Juan Quintela <quintela@redhat.com> Signed-off-by: Juan Quintela <quintela@redhat.com>
		
			
				
	
	
		
			535 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			535 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Bitmap Module
 | |
|  *
 | |
|  * Stolen from linux/src/lib/bitmap.c
 | |
|  *
 | |
|  * Copyright (C) 2010 Corentin Chary
 | |
|  *
 | |
|  * This source code is licensed under the GNU General Public License,
 | |
|  * Version 2.
 | |
|  */
 | |
| 
 | |
| #include "qemu/osdep.h"
 | |
| #include "qemu/bitops.h"
 | |
| #include "qemu/bitmap.h"
 | |
| #include "qemu/atomic.h"
 | |
| 
 | |
| /*
 | |
|  * bitmaps provide an array of bits, implemented using an
 | |
|  * array of unsigned longs.  The number of valid bits in a
 | |
|  * given bitmap does _not_ need to be an exact multiple of
 | |
|  * BITS_PER_LONG.
 | |
|  *
 | |
|  * The possible unused bits in the last, partially used word
 | |
|  * of a bitmap are 'don't care'.  The implementation makes
 | |
|  * no particular effort to keep them zero.  It ensures that
 | |
|  * their value will not affect the results of any operation.
 | |
|  * The bitmap operations that return Boolean (bitmap_empty,
 | |
|  * for example) or scalar (bitmap_weight, for example) results
 | |
|  * carefully filter out these unused bits from impacting their
 | |
|  * results.
 | |
|  *
 | |
|  * These operations actually hold to a slightly stronger rule:
 | |
|  * if you don't input any bitmaps to these ops that have some
 | |
|  * unused bits set, then they won't output any set unused bits
 | |
|  * in output bitmaps.
 | |
|  *
 | |
|  * The byte ordering of bitmaps is more natural on little
 | |
|  * endian architectures.
 | |
|  */
 | |
| 
 | |
| int slow_bitmap_empty(const unsigned long *bitmap, long bits)
 | |
| {
 | |
|     long k, lim = bits/BITS_PER_LONG;
 | |
| 
 | |
|     for (k = 0; k < lim; ++k) {
 | |
|         if (bitmap[k]) {
 | |
|             return 0;
 | |
|         }
 | |
|     }
 | |
|     if (bits % BITS_PER_LONG) {
 | |
|         if (bitmap[k] & BITMAP_LAST_WORD_MASK(bits)) {
 | |
|             return 0;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return 1;
 | |
| }
 | |
| 
 | |
| int slow_bitmap_full(const unsigned long *bitmap, long bits)
 | |
| {
 | |
|     long k, lim = bits/BITS_PER_LONG;
 | |
| 
 | |
|     for (k = 0; k < lim; ++k) {
 | |
|         if (~bitmap[k]) {
 | |
|             return 0;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (bits % BITS_PER_LONG) {
 | |
|         if (~bitmap[k] & BITMAP_LAST_WORD_MASK(bits)) {
 | |
|             return 0;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return 1;
 | |
| }
 | |
| 
 | |
| int slow_bitmap_equal(const unsigned long *bitmap1,
 | |
|                       const unsigned long *bitmap2, long bits)
 | |
| {
 | |
|     long k, lim = bits/BITS_PER_LONG;
 | |
| 
 | |
|     for (k = 0; k < lim; ++k) {
 | |
|         if (bitmap1[k] != bitmap2[k]) {
 | |
|             return 0;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (bits % BITS_PER_LONG) {
 | |
|         if ((bitmap1[k] ^ bitmap2[k]) & BITMAP_LAST_WORD_MASK(bits)) {
 | |
|             return 0;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return 1;
 | |
| }
 | |
| 
 | |
| void slow_bitmap_complement(unsigned long *dst, const unsigned long *src,
 | |
|                             long bits)
 | |
| {
 | |
|     long k, lim = bits/BITS_PER_LONG;
 | |
| 
 | |
|     for (k = 0; k < lim; ++k) {
 | |
|         dst[k] = ~src[k];
 | |
|     }
 | |
| 
 | |
|     if (bits % BITS_PER_LONG) {
 | |
|         dst[k] = ~src[k] & BITMAP_LAST_WORD_MASK(bits);
 | |
|     }
 | |
| }
 | |
| 
 | |
| int slow_bitmap_and(unsigned long *dst, const unsigned long *bitmap1,
 | |
|                     const unsigned long *bitmap2, long bits)
 | |
| {
 | |
|     long k;
 | |
|     long nr = BITS_TO_LONGS(bits);
 | |
|     unsigned long result = 0;
 | |
| 
 | |
|     for (k = 0; k < nr; k++) {
 | |
|         result |= (dst[k] = bitmap1[k] & bitmap2[k]);
 | |
|     }
 | |
|     return result != 0;
 | |
| }
 | |
| 
 | |
| void slow_bitmap_or(unsigned long *dst, const unsigned long *bitmap1,
 | |
|                     const unsigned long *bitmap2, long bits)
 | |
| {
 | |
|     long k;
 | |
|     long nr = BITS_TO_LONGS(bits);
 | |
| 
 | |
|     for (k = 0; k < nr; k++) {
 | |
|         dst[k] = bitmap1[k] | bitmap2[k];
 | |
|     }
 | |
| }
 | |
| 
 | |
| void slow_bitmap_xor(unsigned long *dst, const unsigned long *bitmap1,
 | |
|                      const unsigned long *bitmap2, long bits)
 | |
| {
 | |
|     long k;
 | |
|     long nr = BITS_TO_LONGS(bits);
 | |
| 
 | |
|     for (k = 0; k < nr; k++) {
 | |
|         dst[k] = bitmap1[k] ^ bitmap2[k];
 | |
|     }
 | |
| }
 | |
| 
 | |
| int slow_bitmap_andnot(unsigned long *dst, const unsigned long *bitmap1,
 | |
|                        const unsigned long *bitmap2, long bits)
 | |
| {
 | |
|     long k;
 | |
|     long nr = BITS_TO_LONGS(bits);
 | |
|     unsigned long result = 0;
 | |
| 
 | |
|     for (k = 0; k < nr; k++) {
 | |
|         result |= (dst[k] = bitmap1[k] & ~bitmap2[k]);
 | |
|     }
 | |
|     return result != 0;
 | |
| }
 | |
| 
 | |
| void bitmap_set(unsigned long *map, long start, long nr)
 | |
| {
 | |
|     unsigned long *p = map + BIT_WORD(start);
 | |
|     const long size = start + nr;
 | |
|     int bits_to_set = BITS_PER_LONG - (start % BITS_PER_LONG);
 | |
|     unsigned long mask_to_set = BITMAP_FIRST_WORD_MASK(start);
 | |
| 
 | |
|     assert(start >= 0 && nr >= 0);
 | |
| 
 | |
|     while (nr - bits_to_set >= 0) {
 | |
|         *p |= mask_to_set;
 | |
|         nr -= bits_to_set;
 | |
|         bits_to_set = BITS_PER_LONG;
 | |
|         mask_to_set = ~0UL;
 | |
|         p++;
 | |
|     }
 | |
|     if (nr) {
 | |
|         mask_to_set &= BITMAP_LAST_WORD_MASK(size);
 | |
|         *p |= mask_to_set;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void bitmap_set_atomic(unsigned long *map, long start, long nr)
 | |
| {
 | |
|     unsigned long *p = map + BIT_WORD(start);
 | |
|     const long size = start + nr;
 | |
|     int bits_to_set = BITS_PER_LONG - (start % BITS_PER_LONG);
 | |
|     unsigned long mask_to_set = BITMAP_FIRST_WORD_MASK(start);
 | |
| 
 | |
|     assert(start >= 0 && nr >= 0);
 | |
| 
 | |
|     /* First word */
 | |
|     if (nr - bits_to_set > 0) {
 | |
|         qatomic_or(p, mask_to_set);
 | |
|         nr -= bits_to_set;
 | |
|         bits_to_set = BITS_PER_LONG;
 | |
|         mask_to_set = ~0UL;
 | |
|         p++;
 | |
|     }
 | |
| 
 | |
|     /* Full words */
 | |
|     if (bits_to_set == BITS_PER_LONG) {
 | |
|         while (nr >= BITS_PER_LONG) {
 | |
|             *p = ~0UL;
 | |
|             nr -= BITS_PER_LONG;
 | |
|             p++;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /* Last word */
 | |
|     if (nr) {
 | |
|         mask_to_set &= BITMAP_LAST_WORD_MASK(size);
 | |
|         qatomic_or(p, mask_to_set);
 | |
|     } else {
 | |
|         /* If we avoided the full barrier in qatomic_or(), issue a
 | |
|          * barrier to account for the assignments in the while loop.
 | |
|          */
 | |
|         smp_mb();
 | |
|     }
 | |
| }
 | |
| 
 | |
| void bitmap_clear(unsigned long *map, long start, long nr)
 | |
| {
 | |
|     unsigned long *p = map + BIT_WORD(start);
 | |
|     const long size = start + nr;
 | |
|     int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
 | |
|     unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
 | |
| 
 | |
|     assert(start >= 0 && nr >= 0);
 | |
| 
 | |
|     while (nr - bits_to_clear >= 0) {
 | |
|         *p &= ~mask_to_clear;
 | |
|         nr -= bits_to_clear;
 | |
|         bits_to_clear = BITS_PER_LONG;
 | |
|         mask_to_clear = ~0UL;
 | |
|         p++;
 | |
|     }
 | |
|     if (nr) {
 | |
|         mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
 | |
|         *p &= ~mask_to_clear;
 | |
|     }
 | |
| }
 | |
| 
 | |
| bool bitmap_test_and_clear(unsigned long *map, long start, long nr)
 | |
| {
 | |
|     unsigned long *p = map + BIT_WORD(start);
 | |
|     const long size = start + nr;
 | |
|     int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
 | |
|     unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
 | |
|     bool dirty = false;
 | |
| 
 | |
|     assert(start >= 0 && nr >= 0);
 | |
| 
 | |
|     /* First word */
 | |
|     if (nr - bits_to_clear > 0) {
 | |
|         if ((*p) & mask_to_clear) {
 | |
|             dirty = true;
 | |
|         }
 | |
|         *p &= ~mask_to_clear;
 | |
|         nr -= bits_to_clear;
 | |
|         bits_to_clear = BITS_PER_LONG;
 | |
|         p++;
 | |
|     }
 | |
| 
 | |
|     /* Full words */
 | |
|     if (bits_to_clear == BITS_PER_LONG) {
 | |
|         while (nr >= BITS_PER_LONG) {
 | |
|             if (*p) {
 | |
|                 dirty = true;
 | |
|                 *p = 0;
 | |
|             }
 | |
|             nr -= BITS_PER_LONG;
 | |
|             p++;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /* Last word */
 | |
|     if (nr) {
 | |
|         mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
 | |
|         if ((*p) & mask_to_clear) {
 | |
|             dirty = true;
 | |
|         }
 | |
|         *p &= ~mask_to_clear;
 | |
|     }
 | |
| 
 | |
|     return dirty;
 | |
| }
 | |
| 
 | |
| bool bitmap_test_and_clear_atomic(unsigned long *map, long start, long nr)
 | |
| {
 | |
|     unsigned long *p = map + BIT_WORD(start);
 | |
|     const long size = start + nr;
 | |
|     int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
 | |
|     unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
 | |
|     unsigned long dirty = 0;
 | |
|     unsigned long old_bits;
 | |
| 
 | |
|     assert(start >= 0 && nr >= 0);
 | |
| 
 | |
|     /* First word */
 | |
|     if (nr - bits_to_clear > 0) {
 | |
|         old_bits = qatomic_fetch_and(p, ~mask_to_clear);
 | |
|         dirty |= old_bits & mask_to_clear;
 | |
|         nr -= bits_to_clear;
 | |
|         bits_to_clear = BITS_PER_LONG;
 | |
|         mask_to_clear = ~0UL;
 | |
|         p++;
 | |
|     }
 | |
| 
 | |
|     /* Full words */
 | |
|     if (bits_to_clear == BITS_PER_LONG) {
 | |
|         while (nr >= BITS_PER_LONG) {
 | |
|             if (*p) {
 | |
|                 old_bits = qatomic_xchg(p, 0);
 | |
|                 dirty |= old_bits;
 | |
|             }
 | |
|             nr -= BITS_PER_LONG;
 | |
|             p++;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /* Last word */
 | |
|     if (nr) {
 | |
|         mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
 | |
|         old_bits = qatomic_fetch_and(p, ~mask_to_clear);
 | |
|         dirty |= old_bits & mask_to_clear;
 | |
|     } else {
 | |
|         if (!dirty) {
 | |
|             smp_mb();
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return dirty != 0;
 | |
| }
 | |
| 
 | |
| void bitmap_copy_and_clear_atomic(unsigned long *dst, unsigned long *src,
 | |
|                                   long nr)
 | |
| {
 | |
|     while (nr > 0) {
 | |
|         *dst = qatomic_xchg(src, 0);
 | |
|         dst++;
 | |
|         src++;
 | |
|         nr -= BITS_PER_LONG;
 | |
|     }
 | |
| }
 | |
| 
 | |
| #define ALIGN_MASK(x,mask)      (((x)+(mask))&~(mask))
 | |
| 
 | |
| /**
 | |
|  * bitmap_find_next_zero_area - find a contiguous aligned zero area
 | |
|  * @map: The address to base the search on
 | |
|  * @size: The bitmap size in bits
 | |
|  * @start: The bitnumber to start searching at
 | |
|  * @nr: The number of zeroed bits we're looking for
 | |
|  * @align_mask: Alignment mask for zero area
 | |
|  *
 | |
|  * The @align_mask should be one less than a power of 2; the effect is that
 | |
|  * the bit offset of all zero areas this function finds is multiples of that
 | |
|  * power of 2. A @align_mask of 0 means no alignment is required.
 | |
|  */
 | |
| unsigned long bitmap_find_next_zero_area(unsigned long *map,
 | |
|                                          unsigned long size,
 | |
|                                          unsigned long start,
 | |
|                                          unsigned long nr,
 | |
|                                          unsigned long align_mask)
 | |
| {
 | |
|     unsigned long index, end, i;
 | |
| again:
 | |
|     index = find_next_zero_bit(map, size, start);
 | |
| 
 | |
|     /* Align allocation */
 | |
|     index = ALIGN_MASK(index, align_mask);
 | |
| 
 | |
|     end = index + nr;
 | |
|     if (end > size) {
 | |
|         return end;
 | |
|     }
 | |
|     i = find_next_bit(map, end, index);
 | |
|     if (i < end) {
 | |
|         start = i + 1;
 | |
|         goto again;
 | |
|     }
 | |
|     return index;
 | |
| }
 | |
| 
 | |
| int slow_bitmap_intersects(const unsigned long *bitmap1,
 | |
|                            const unsigned long *bitmap2, long bits)
 | |
| {
 | |
|     long k, lim = bits/BITS_PER_LONG;
 | |
| 
 | |
|     for (k = 0; k < lim; ++k) {
 | |
|         if (bitmap1[k] & bitmap2[k]) {
 | |
|             return 1;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (bits % BITS_PER_LONG) {
 | |
|         if ((bitmap1[k] & bitmap2[k]) & BITMAP_LAST_WORD_MASK(bits)) {
 | |
|             return 1;
 | |
|         }
 | |
|     }
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| long slow_bitmap_count_one(const unsigned long *bitmap, long nbits)
 | |
| {
 | |
|     long k, lim = nbits / BITS_PER_LONG, result = 0;
 | |
| 
 | |
|     for (k = 0; k < lim; k++) {
 | |
|         result += ctpopl(bitmap[k]);
 | |
|     }
 | |
| 
 | |
|     if (nbits % BITS_PER_LONG) {
 | |
|         result += ctpopl(bitmap[k] & BITMAP_LAST_WORD_MASK(nbits));
 | |
|     }
 | |
| 
 | |
|     return result;
 | |
| }
 | |
| 
 | |
| static void bitmap_to_from_le(unsigned long *dst,
 | |
|                               const unsigned long *src, long nbits)
 | |
| {
 | |
|     long len = BITS_TO_LONGS(nbits);
 | |
| 
 | |
| #if HOST_BIG_ENDIAN
 | |
|     long index;
 | |
| 
 | |
|     for (index = 0; index < len; index++) {
 | |
| # if HOST_LONG_BITS == 64
 | |
|         dst[index] = bswap64(src[index]);
 | |
| # else
 | |
|         dst[index] = bswap32(src[index]);
 | |
| # endif
 | |
|     }
 | |
| #else
 | |
|     memcpy(dst, src, len * sizeof(unsigned long));
 | |
| #endif
 | |
| }
 | |
| 
 | |
| void bitmap_from_le(unsigned long *dst, const unsigned long *src,
 | |
|                     long nbits)
 | |
| {
 | |
|     bitmap_to_from_le(dst, src, nbits);
 | |
| }
 | |
| 
 | |
| void bitmap_to_le(unsigned long *dst, const unsigned long *src,
 | |
|                   long nbits)
 | |
| {
 | |
|     bitmap_to_from_le(dst, src, nbits);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Copy "src" bitmap with a positive offset and put it into the "dst"
 | |
|  * bitmap.  The caller needs to make sure the bitmap size of "src"
 | |
|  * is bigger than (shift + nbits).
 | |
|  */
 | |
| void bitmap_copy_with_src_offset(unsigned long *dst, const unsigned long *src,
 | |
|                                  unsigned long shift, unsigned long nbits)
 | |
| {
 | |
|     unsigned long left_mask, right_mask, last_mask;
 | |
| 
 | |
|     /* Proper shift src pointer to the first word to copy from */
 | |
|     src += BIT_WORD(shift);
 | |
|     shift %= BITS_PER_LONG;
 | |
| 
 | |
|     if (!shift) {
 | |
|         /* Fast path */
 | |
|         bitmap_copy(dst, src, nbits);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     right_mask = (1ul << shift) - 1;
 | |
|     left_mask = ~right_mask;
 | |
| 
 | |
|     while (nbits >= BITS_PER_LONG) {
 | |
|         *dst = (*src & left_mask) >> shift;
 | |
|         *dst |= (src[1] & right_mask) << (BITS_PER_LONG - shift);
 | |
|         dst++;
 | |
|         src++;
 | |
|         nbits -= BITS_PER_LONG;
 | |
|     }
 | |
| 
 | |
|     if (nbits > BITS_PER_LONG - shift) {
 | |
|         *dst = (*src & left_mask) >> shift;
 | |
|         nbits -= BITS_PER_LONG - shift;
 | |
|         last_mask = (1ul << nbits) - 1;
 | |
|         *dst |= (src[1] & last_mask) << (BITS_PER_LONG - shift);
 | |
|     } else if (nbits) {
 | |
|         last_mask = (1ul << nbits) - 1;
 | |
|         *dst = (*src >> shift) & last_mask;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Copy "src" bitmap into the "dst" bitmap with an offset in the
 | |
|  * "dst".  The caller needs to make sure the bitmap size of "dst" is
 | |
|  * bigger than (shift + nbits).
 | |
|  */
 | |
| void bitmap_copy_with_dst_offset(unsigned long *dst, const unsigned long *src,
 | |
|                                  unsigned long shift, unsigned long nbits)
 | |
| {
 | |
|     unsigned long left_mask, right_mask, last_mask;
 | |
| 
 | |
|     /* Proper shift dst pointer to the first word to copy from */
 | |
|     dst += BIT_WORD(shift);
 | |
|     shift %= BITS_PER_LONG;
 | |
| 
 | |
|     if (!shift) {
 | |
|         /* Fast path */
 | |
|         bitmap_copy(dst, src, nbits);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     right_mask = (1ul << (BITS_PER_LONG - shift)) - 1;
 | |
|     left_mask = ~right_mask;
 | |
| 
 | |
|     *dst &= (1ul << shift) - 1;
 | |
|     while (nbits >= BITS_PER_LONG) {
 | |
|         *dst |= (*src & right_mask) << shift;
 | |
|         dst[1] = (*src & left_mask) >> (BITS_PER_LONG - shift);
 | |
|         dst++;
 | |
|         src++;
 | |
|         nbits -= BITS_PER_LONG;
 | |
|     }
 | |
| 
 | |
|     if (nbits > BITS_PER_LONG - shift) {
 | |
|         *dst |= (*src & right_mask) << shift;
 | |
|         nbits -= BITS_PER_LONG - shift;
 | |
|         last_mask = ((1ul << nbits) - 1) << (BITS_PER_LONG - shift);
 | |
|         dst[1] = (*src & last_mask) >> (BITS_PER_LONG - shift);
 | |
|     } else if (nbits) {
 | |
|         last_mask = (1ul << nbits) - 1;
 | |
|         *dst |= (*src & last_mask) << shift;
 | |
|     }
 | |
| }
 |