/*
 * Bitmap Module
 *
 * Stolen from linux/src/lib/bitmap.c
 *
 * Copyright (C) 2010 Corentin Chary
 *
 * This source code is licensed under the GNU General Public License,
 * Version 2.
 */

#include "qemu/osdep.h"
#include "qemu/bitops.h"
#include "qemu/bitmap.h"
#include "qemu/atomic.h"

/*
 * Bitmaps provide an array of bits, implemented using an
 * array of unsigned longs. The number of valid bits in a
 * given bitmap does _not_ need to be an exact multiple of
 * BITS_PER_LONG.
 *
 * The possible unused bits in the last, partially used word
 * of a bitmap are 'don't care'. The implementation makes
 * no particular effort to keep them zero. It ensures that
 * their value will not affect the results of any operation.
 * The bitmap operations that return Boolean (bitmap_empty,
 * for example) or scalar (bitmap_weight, for example) results
 * carefully prevent these unused bits from affecting their
 * results.
 *
 * These operations actually hold to a slightly stronger rule:
 * if none of the input bitmaps have any unused bits set, then
 * the output bitmaps won't have any unused bits set either.
 *
 * The byte ordering of bitmaps is more natural on little-endian
 * architectures.
 */
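
/*
 * A minimal usage sketch, for illustration only; DECLARE_BITMAP(),
 * bitmap_zero() and bitmap_empty() come from "qemu/bitmap.h":
 *
 *   DECLARE_BITMAP(flags, 80);
 *
 *   bitmap_zero(flags, 80);
 *   bitmap_set(flags, 4, 12);            // set bits [4, 16)
 *   assert(!bitmap_empty(flags, 80));
 *   bitmap_clear(flags, 4, 12);          // clear them again
 *   assert(bitmap_empty(flags, 80));
 */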

int slow_bitmap_empty(const unsigned long *bitmap, long bits)
{
    long k, lim = bits/BITS_PER_LONG;

    for (k = 0; k < lim; ++k) {
        if (bitmap[k]) {
            return 0;
        }
    }
    if (bits % BITS_PER_LONG) {
        if (bitmap[k] & BITMAP_LAST_WORD_MASK(bits)) {
            return 0;
        }
    }

    return 1;
}

int slow_bitmap_full(const unsigned long *bitmap, long bits)
{
    long k, lim = bits/BITS_PER_LONG;

    for (k = 0; k < lim; ++k) {
        if (~bitmap[k]) {
            return 0;
        }
    }

    if (bits % BITS_PER_LONG) {
        if (~bitmap[k] & BITMAP_LAST_WORD_MASK(bits)) {
            return 0;
        }
    }

    return 1;
}

int slow_bitmap_equal(const unsigned long *bitmap1,
                      const unsigned long *bitmap2, long bits)
{
    long k, lim = bits/BITS_PER_LONG;

    for (k = 0; k < lim; ++k) {
        if (bitmap1[k] != bitmap2[k]) {
            return 0;
        }
    }

    if (bits % BITS_PER_LONG) {
        if ((bitmap1[k] ^ bitmap2[k]) & BITMAP_LAST_WORD_MASK(bits)) {
            return 0;
        }
    }

    return 1;
}

void slow_bitmap_complement(unsigned long *dst, const unsigned long *src,
                            long bits)
{
    long k, lim = bits/BITS_PER_LONG;

    for (k = 0; k < lim; ++k) {
        dst[k] = ~src[k];
    }

    if (bits % BITS_PER_LONG) {
        dst[k] = ~src[k] & BITMAP_LAST_WORD_MASK(bits);
    }
}

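/*
 * Returns non-zero if the result (dst = bitmap1 & bitmap2) has any bit
 * set; slow_bitmap_andnot() below follows the same convention.
 */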
int slow_bitmap_and(unsigned long *dst, const unsigned long *bitmap1,
                    const unsigned long *bitmap2, long bits)
{
    long k;
    long nr = BITS_TO_LONGS(bits);
    unsigned long result = 0;

    for (k = 0; k < nr; k++) {
        result |= (dst[k] = bitmap1[k] & bitmap2[k]);
    }
    return result != 0;
}

void slow_bitmap_or(unsigned long *dst, const unsigned long *bitmap1,
                    const unsigned long *bitmap2, long bits)
{
    long k;
    long nr = BITS_TO_LONGS(bits);

    for (k = 0; k < nr; k++) {
        dst[k] = bitmap1[k] | bitmap2[k];
    }
}

void slow_bitmap_xor(unsigned long *dst, const unsigned long *bitmap1,
                     const unsigned long *bitmap2, long bits)
{
    long k;
    long nr = BITS_TO_LONGS(bits);

    for (k = 0; k < nr; k++) {
        dst[k] = bitmap1[k] ^ bitmap2[k];
    }
}

int slow_bitmap_andnot(unsigned long *dst, const unsigned long *bitmap1,
                       const unsigned long *bitmap2, long bits)
{
    long k;
    long nr = BITS_TO_LONGS(bits);
    unsigned long result = 0;

    for (k = 0; k < nr; k++) {
        result |= (dst[k] = bitmap1[k] & ~bitmap2[k]);
    }
    return result != 0;
}

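/*
 * Set @nr bits starting at @start: build a mask for the partial first
 * word, walk any full words with an all-ones mask, then trim the mask
 * for a partial last word.
 */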
void bitmap_set(unsigned long *map, long start, long nr)
{
    unsigned long *p = map + BIT_WORD(start);
    const long size = start + nr;
    int bits_to_set = BITS_PER_LONG - (start % BITS_PER_LONG);
    unsigned long mask_to_set = BITMAP_FIRST_WORD_MASK(start);

    assert(start >= 0 && nr >= 0);

    while (nr - bits_to_set >= 0) {
        *p |= mask_to_set;
        nr -= bits_to_set;
        bits_to_set = BITS_PER_LONG;
        mask_to_set = ~0UL;
        p++;
    }
    if (nr) {
        mask_to_set &= BITMAP_LAST_WORD_MASK(size);
        *p |= mask_to_set;
    }
}

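/*
 * Like bitmap_set(), but partial words are updated with an atomic OR.
 * Full words are still written with plain stores; the final
 * qatomic_or() or smp_mb() orders those stores for concurrent readers.
 */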
void bitmap_set_atomic(unsigned long *map, long start, long nr)
{
    unsigned long *p = map + BIT_WORD(start);
    const long size = start + nr;
    int bits_to_set = BITS_PER_LONG - (start % BITS_PER_LONG);
    unsigned long mask_to_set = BITMAP_FIRST_WORD_MASK(start);

    assert(start >= 0 && nr >= 0);

    /* First word */
    if (nr - bits_to_set > 0) {
        qatomic_or(p, mask_to_set);
        nr -= bits_to_set;
        bits_to_set = BITS_PER_LONG;
        mask_to_set = ~0UL;
        p++;
    }

    /* Full words */
    if (bits_to_set == BITS_PER_LONG) {
        while (nr >= BITS_PER_LONG) {
            *p = ~0UL;
            nr -= BITS_PER_LONG;
            p++;
        }
    }

    /* Last word */
    if (nr) {
        mask_to_set &= BITMAP_LAST_WORD_MASK(size);
        qatomic_or(p, mask_to_set);
    } else {
        /* If we avoided the full barrier in qatomic_or(), issue a
         * barrier to account for the assignments in the while loop.
         */
        smp_mb();
    }
}

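/*
 * Clear @nr bits starting at @start, mirroring the mask walk used by
 * bitmap_set().
 */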
void bitmap_clear(unsigned long *map, long start, long nr)
{
    unsigned long *p = map + BIT_WORD(start);
    const long size = start + nr;
    int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
    unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);

    assert(start >= 0 && nr >= 0);

    while (nr - bits_to_clear >= 0) {
        *p &= ~mask_to_clear;
        nr -= bits_to_clear;
        bits_to_clear = BITS_PER_LONG;
        mask_to_clear = ~0UL;
        p++;
    }
    if (nr) {
        mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
        *p &= ~mask_to_clear;
    }
}

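/*
 * Clear @nr bits starting at @start and return true if any of them was
 * previously set. Non-atomic counterpart of
 * bitmap_test_and_clear_atomic().
 */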
bool bitmap_test_and_clear(unsigned long *map, long start, long nr)
{
    unsigned long *p = map + BIT_WORD(start);
    const long size = start + nr;
    int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
    unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
    bool dirty = false;

    assert(start >= 0 && nr >= 0);

    /* First word */
    if (nr - bits_to_clear > 0) {
        if ((*p) & mask_to_clear) {
            dirty = true;
        }
        *p &= ~mask_to_clear;
        nr -= bits_to_clear;
        bits_to_clear = BITS_PER_LONG;
        mask_to_clear = ~0UL;
        p++;
    }

    /* Full words */
    if (bits_to_clear == BITS_PER_LONG) {
        while (nr >= BITS_PER_LONG) {
            if (*p) {
                dirty = true;
                *p = 0;
            }
            nr -= BITS_PER_LONG;
            p++;
        }
    }

    /* Last word */
    if (nr) {
        mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
        if ((*p) & mask_to_clear) {
            dirty = true;
        }
        *p &= ~mask_to_clear;
    }

    return dirty;
}

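/*
 * Atomic variant of bitmap_test_and_clear(): partial words are cleared
 * with qatomic_fetch_and(), non-zero full words with qatomic_xchg(), so
 * dirty bits set by concurrent writers are not lost.
 */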
bool bitmap_test_and_clear_atomic(unsigned long *map, long start, long nr)
{
    unsigned long *p = map + BIT_WORD(start);
    const long size = start + nr;
    int bits_to_clear = BITS_PER_LONG - (start % BITS_PER_LONG);
    unsigned long mask_to_clear = BITMAP_FIRST_WORD_MASK(start);
    unsigned long dirty = 0;
    unsigned long old_bits;

    assert(start >= 0 && nr >= 0);

    /* First word */
    if (nr - bits_to_clear > 0) {
        old_bits = qatomic_fetch_and(p, ~mask_to_clear);
        dirty |= old_bits & mask_to_clear;
        nr -= bits_to_clear;
        bits_to_clear = BITS_PER_LONG;
        mask_to_clear = ~0UL;
        p++;
    }

    /* Full words */
    if (bits_to_clear == BITS_PER_LONG) {
        while (nr >= BITS_PER_LONG) {
            if (*p) {
                old_bits = qatomic_xchg(p, 0);
                dirty |= old_bits;
            }
            nr -= BITS_PER_LONG;
            p++;
        }
    }

    /* Last word */
    if (nr) {
        mask_to_clear &= BITMAP_LAST_WORD_MASK(size);
        old_bits = qatomic_fetch_and(p, ~mask_to_clear);
        dirty |= old_bits & mask_to_clear;
    } else {
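        /* If nothing was dirty, no qatomic_xchg() (and thus no full
         * barrier) was issued in the loop above, so emit one here to
         * account for the plain reads of *p.
         */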
        if (!dirty) {
            smp_mb();
        }
    }

    return dirty != 0;
}

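/*
 * Copy @src to @dst one word at a time, atomically fetching and zeroing
 * each source word. @nr is effectively rounded up to a multiple of
 * BITS_PER_LONG.
 */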
void bitmap_copy_and_clear_atomic(unsigned long *dst, unsigned long *src,
                                  long nr)
{
    while (nr > 0) {
        *dst = qatomic_xchg(src, 0);
        dst++;
        src++;
        nr -= BITS_PER_LONG;
    }
}

#define ALIGN_MASK(x,mask) (((x)+(mask))&~(mask))

/**
 * bitmap_find_next_zero_area - find a contiguous aligned zero area
 * @map: The address to base the search on
 * @size: The bitmap size in bits
 * @start: The bit number to start searching at
 * @nr: The number of zeroed bits we're looking for
 * @align_mask: Alignment mask for zero area
 *
 * The @align_mask should be one less than a power of 2; the effect is that
 * the bit offset of every zero area this function finds is a multiple of
 * that power of 2. An @align_mask of 0 means no alignment is required.
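 *
 * On failure, the returned value exceeds @size. A minimal usage
 * sketch, reserving four naturally aligned bits:
 *
 *   idx = bitmap_find_next_zero_area(map, size, 0, 4, 3);
 *   if (idx < size) {
 *       bitmap_set(map, idx, 4);
 *   }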
 */
unsigned long bitmap_find_next_zero_area(unsigned long *map,
                                         unsigned long size,
                                         unsigned long start,
                                         unsigned long nr,
                                         unsigned long align_mask)
{
    unsigned long index, end, i;
again:
    index = find_next_zero_bit(map, size, start);

    /* Align allocation */
    index = ALIGN_MASK(index, align_mask);

    end = index + nr;
    if (end > size) {
        return end;
    }
    i = find_next_bit(map, end, index);
    if (i < end) {
        start = i + 1;
        goto again;
    }
    return index;
}

int slow_bitmap_intersects(const unsigned long *bitmap1,
                           const unsigned long *bitmap2, long bits)
{
    long k, lim = bits/BITS_PER_LONG;

    for (k = 0; k < lim; ++k) {
        if (bitmap1[k] & bitmap2[k]) {
            return 1;
        }
    }

    if (bits % BITS_PER_LONG) {
        if ((bitmap1[k] & bitmap2[k]) & BITMAP_LAST_WORD_MASK(bits)) {
            return 1;
        }
    }
    return 0;
}

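/*
 * Count the set bits (population count) in the first @nbits bits,
 * masking off the unused tail of the last word.
 */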
long slow_bitmap_count_one(const unsigned long *bitmap, long nbits)
{
    long k, lim = nbits / BITS_PER_LONG, result = 0;

    for (k = 0; k < lim; k++) {
        result += ctpopl(bitmap[k]);
    }

    if (nbits % BITS_PER_LONG) {
        result += ctpopl(bitmap[k] & BITMAP_LAST_WORD_MASK(nbits));
    }

    return result;
}

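/*
 * Convert between the host layout of a bitmap and a canonical
 * little-endian layout. The transformation is its own inverse, so a
 * single helper serves both directions: each word is byte-swapped on
 * big-endian hosts and copied verbatim on little-endian ones.
 */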
static void bitmap_to_from_le(unsigned long *dst,
                              const unsigned long *src, long nbits)
{
    long len = BITS_TO_LONGS(nbits);

#if HOST_BIG_ENDIAN
    long index;

    for (index = 0; index < len; index++) {
# if HOST_LONG_BITS == 64
        dst[index] = bswap64(src[index]);
# else
        dst[index] = bswap32(src[index]);
# endif
    }
#else
    memcpy(dst, src, len * sizeof(unsigned long));
#endif
}

void bitmap_from_le(unsigned long *dst, const unsigned long *src,
                    long nbits)
{
    bitmap_to_from_le(dst, src, nbits);
}

void bitmap_to_le(unsigned long *dst, const unsigned long *src,
                  long nbits)
{
    bitmap_to_from_le(dst, src, nbits);
}

/*
 * Copy the "src" bitmap, starting at a positive bit offset, into the
 * "dst" bitmap. The caller needs to make sure the bitmap size of
 * "src" is at least (shift + nbits).
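 *
 * For example, to copy bits [12, 112) of "src" into bits [0, 100) of
 * "dst":
 *
 *   bitmap_copy_with_src_offset(dst, src, 12, 100);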
 */
void bitmap_copy_with_src_offset(unsigned long *dst, const unsigned long *src,
                                 unsigned long shift, unsigned long nbits)
{
    unsigned long left_mask, right_mask, last_mask;

    /* Properly shift the src pointer to the first word to copy from */
    src += BIT_WORD(shift);
    shift %= BITS_PER_LONG;

    if (!shift) {
        /* Fast path */
        bitmap_copy(dst, src, nbits);
        return;
    }

    right_mask = (1ul << shift) - 1;
    left_mask = ~right_mask;

    while (nbits >= BITS_PER_LONG) {
        *dst = (*src & left_mask) >> shift;
        *dst |= (src[1] & right_mask) << (BITS_PER_LONG - shift);
        dst++;
        src++;
        nbits -= BITS_PER_LONG;
    }

    if (nbits > BITS_PER_LONG - shift) {
        *dst = (*src & left_mask) >> shift;
        nbits -= BITS_PER_LONG - shift;
        last_mask = (1ul << nbits) - 1;
        *dst |= (src[1] & last_mask) << (BITS_PER_LONG - shift);
    } else if (nbits) {
        last_mask = (1ul << nbits) - 1;
        *dst = (*src >> shift) & last_mask;
    }
}

/*
 * Copy the "src" bitmap into the "dst" bitmap at a positive bit
 * offset. The caller needs to make sure the bitmap size of "dst" is
 * at least (shift + nbits).
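 *
 * For example, to copy bits [0, 100) of "src" into bits [12, 112) of
 * "dst":
 *
 *   bitmap_copy_with_dst_offset(dst, src, 12, 100);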
 */
void bitmap_copy_with_dst_offset(unsigned long *dst, const unsigned long *src,
                                 unsigned long shift, unsigned long nbits)
{
    unsigned long left_mask, right_mask, last_mask;

    /* Properly shift the dst pointer to the first word to copy to */
    dst += BIT_WORD(shift);
    shift %= BITS_PER_LONG;

    if (!shift) {
        /* Fast path */
        bitmap_copy(dst, src, nbits);
        return;
    }

    right_mask = (1ul << (BITS_PER_LONG - shift)) - 1;
    left_mask = ~right_mask;

    *dst &= (1ul << shift) - 1;
    while (nbits >= BITS_PER_LONG) {
        *dst |= (*src & right_mask) << shift;
        dst[1] = (*src & left_mask) >> (BITS_PER_LONG - shift);
        dst++;
        src++;
        nbits -= BITS_PER_LONG;
    }

    if (nbits > BITS_PER_LONG - shift) {
        *dst |= (*src & right_mask) << shift;
        nbits -= BITS_PER_LONG - shift;
        last_mask = ((1ul << nbits) - 1) << (BITS_PER_LONG - shift);
        dst[1] = (*src & last_mask) >> (BITS_PER_LONG - shift);
    } else if (nbits) {
        last_mask = (1ul << nbits) - 1;
        *dst |= (*src & last_mask) << shift;
    }
}