OpenSDN source code
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
bitset.cc
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2013 Juniper Networks, Inc. All rights reserved.
3  */
4 
5 #include "base/bitset.h"
6 
7 #include <cassert>
8 #include <sstream>
9 #include <string>
10 #include <string.h>
11 
12 #include "base/util.h"
13 #include "base/string_util.h"
14 
15 using namespace std;
16 
17 //
18 // Provides the same functionality as ffsl. Needed as ffsl is not supported
19 // on all platforms. Note that the positions are numbered 1 through 64, with
20 // a return value of 0 indicating that there are no set bits.
21 //
22 static int find_first_set64(uint64_t value) {
23  int bit;
24 
25  int lower = static_cast<int>(value);
26  if ((bit = ffs(lower)) > 0)
27  return bit;
28 
29  int upper = value >> 32;
30  if ((bit = ffs(upper)) > 0)
31  return 32 + bit;
32 
33  return 0;
34 }
35 
36 static int find_first_clear64(uint64_t value) {
37  return find_first_set64(~value);
38 }
39 
40 //
41 // Provides the same functionality as fls. Needed as fls is not supported
42 // on all platforms. Note that the positions are numbered 1 through 32, with
43 // a return value of 0 indicating that there are no set bits.
44 //
45 static int find_last_set32(uint32_t value) {
46  if (value == 0)
47  return 0;
48 
49  int bit = 32;
50  if ((value & 0xFFFF0000U) == 0) {
51  value <<= 16;
52  bit -= 16;
53  }
54  if ((value & 0xFF000000U) == 0) {
55  value <<= 8;
56  bit -= 8;
57  }
58  if ((value & 0xF0000000U) == 0) {
59  value <<= 4;
60  bit -= 4;
61  }
62  if ((value & 0xC0000000U) == 0) {
63  value <<= 2;
64  bit -= 2;
65  }
66  if ((value & 0x80000000U) == 0) {
67  value <<= 1;
68  bit -= 1;
69  }
70 
71  return bit;
72 }
73 
74 //
75 // Provides the same functionality as flsl. Needed as flsl is not supported
76 // on all platforms. Note that the positions are numbered 1 through 64, with
77 // a return value of 0 indicating that there are no set bits.
78 //
79 static int find_last_set64(uint64_t value) {
80  int bit;
81 
82  int upper = value >> 32;
83  if ((bit = find_last_set32(upper)) > 0)
84  return 32 + bit;
85 
86  int lower = static_cast<int>(value);
87  if ((bit = find_last_set32(lower)) > 0)
88  return bit;
89 
90  return 0;
91 }
92 
93 //
94 // Return the number of set bits. K&R method.
95 //
96 static int num_bits_set(uint64_t value) {
97  int count = 0;
98  while (value != 0) {
99  value &= value - 1;
100  count++;
101  }
102  return count;
103 }
104 
105 // Position pos is w.r.t the entire bitset, starts at 0.
106 // Index idx is the block number i.e. the index in the vector, starts at 0.
107 // Offset offset is w.r.t a given 64 bit block, starts at 0.
108 static inline size_t block_index(size_t pos) {
109  return pos / 64;
110 }
111 
112 static inline size_t block_offset(size_t pos) {
113  return pos % 64;
114 }
115 
116 static inline size_t bit_position(size_t idx, size_t offset) {
117  return (idx * 64 + offset);
118 }
119 
120 const size_t BitSet::npos;
121 
122 //
123 // Set bit at given position, growing the vector if needed.
124 //
125 BitSet &BitSet::set(size_t pos) {
126  size_t idx = block_index(pos);
127  if (idx >= blocks_.size())
128  blocks_.resize(idx + 1);
129  blocks_[idx] |= 1LL << block_offset(pos);
130  return *this;
131 }
132 
133 //
134 // Reset bit at given position, shrinking the vector if possible.
135 //
136 BitSet &BitSet::reset(size_t pos) {
137  size_t idx = block_index(pos);
138  if (idx < blocks_.size()) {
139  blocks_[idx] &= ~(1LL << block_offset(pos));
140  compact();
141  }
142  return *this;
143 }
144 
145 // Test bit at given position.
146 bool BitSet::test(size_t pos) const {
147  size_t idx = block_index(pos);
148  if (idx < blocks_.size()) {
149  return ((blocks_[idx] & (1LL << block_offset(pos))) != 0);
150  } else {
151  return false;
152  }
153 }
154 
155 //
156 // Shortcut to reset all bits in the bitset.
157 //
159  blocks_.resize(0);
160 }
161 
162 //
163 // Return true if there are no bits in the bitset.
164 //
165 bool BitSet::empty() const {
166  return (blocks_.size() == 0);
167 }
168 
169 //
170 // Return true if no bits are set.
171 //
172 bool BitSet::none() const {
173  return (blocks_.size() == 0);
174 }
175 
176 //
177 // Return true at least one bit is set.
178 //
179 bool BitSet::any() const {
180  return (blocks_.size() != 0);
181 }
182 
183 //
184 // Return the raw number of bits in the bitset. Simply depends on the number
185 // of blocks in the vector.
186 //
187 size_t BitSet::size() const {
188  return blocks_.size() * 64;
189 }
190 
191 //
192 // Return total number of set bits.
193 //
194 size_t BitSet::count() const {
195  size_t count = 0;
196  for (size_t idx = 0; idx < blocks_.size(); idx++) {
197  count += num_bits_set(blocks_[idx]);
198  }
199  return count;
200 }
201 
202 //
203 // Shrink the underlying vector as much as possible. All trailing blocks
204 // that are 0 can be removed.
205 //
206 // Note that the for loop does not handle idx 0 since the loop variable
207 // is unsigned.
208 //
210  if (blocks_.size() == 0)
211  return;
212 
213  for (size_t idx = blocks_.size() - 1; idx > 0; idx--) {
214  if (blocks_[idx] != 0) {
215  blocks_.resize(idx + 1);
216  return;
217  }
218  }
219 
220  if (blocks_[0] != 0) {
221  blocks_.resize(1);
222  return;
223  }
224 
225  blocks_.clear();
226 }
227 
228 //
229 // Sanity check a bitset. The last block must never be 0. Always called
230 // after any compaction is done or in cases where no compaction is needed.
231 //
233  size_t mysize = blocks_.size();
234  if (mysize != 0)
235  assert(blocks_[mysize -1] != 0);
236 }
237 
238 //
239 // Return the position of the first set bit. Needs to compensate for the
240 // return value convention used by find_first_set64.
241 //
242 size_t BitSet::find_first() const {
243  for (size_t idx = 0; idx < blocks_.size(); idx++) {
244  int bit = find_first_set64(blocks_[idx]);
245  if (bit > 0)
246  return bit_position(idx, bit - 1);
247  }
248  return BitSet::npos;
249 }
250 
251 //
252 // Return the position of the next set bit. Needs to compensate for the
253 // return value convention used by find_first_set64.
254 //
255 size_t BitSet::find_next(size_t pos) const {
256  size_t idx = block_index(pos);
257 
258  // If the block index is beyond the vector, we're done.
259  if (idx >= blocks_.size())
260  return BitSet::npos;
261 
262  // If the offset is not 63, clear out the bits from 0 through offset
263  // and look for the first set bit.
264  if (block_offset(pos) < 63) {
265  uint64_t temp = blocks_[idx] & ~((1LL << (block_offset(pos) + 1)) - 1);
266  int bit = find_first_set64(temp);
267  if (bit > 0)
268  return bit_position(idx, bit - 1);
269  }
270 
271  // Go through all blocks after the start block for the pos and see if
272  // there's a set bit.
273  for (idx++; idx < blocks_.size(); idx++) {
274  int bit = find_first_set64(blocks_[idx]);
275  if (bit > 0)
276  return bit_position(idx, bit - 1);
277  }
278  return BitSet::npos;
279 }
280 
281 //
282 // Return the position of the last set bit. Needs to compensate for the
283 // return value convention used by find_last_set64.
284 //
285 // Note that we only need to look at the last block since that must have
286 // at least one bit set.
287 //
288 size_t BitSet::find_last() const {
289  if (blocks_.size() == 0)
290  return BitSet::npos;
291 
292  size_t idx = blocks_.size() - 1;
293  int bit = find_last_set64(blocks_[idx]);
294  if (bit > 0)
295  return bit_position(idx, bit - 1);
296 
297  return BitSet::npos;
298 }
299 
300 //
301 // Return the position of the first clear bit. It could be beyond the last
302 // block in the vector. This is fine as we automatically grow the vector if
303 // needed from set().
304 //
305 // Need to compensate for return value convention used by find_first_clear64.
306 //
307 size_t BitSet::find_first_clear() const {
308  for (size_t idx = 0; idx < blocks_.size(); idx++) {
309  int bit = find_first_clear64(blocks_[idx]);
310  if (bit > 0) {
311  return bit_position(idx, bit - 1);
312  }
313  }
314  return size();
315 }
316 
317 //
318 // Return the position of the next clear bit. It could be beyond the last
319 // block in the vector. This is fine as we automatically grow the vector if
320 // needed from set().
321 //
322 // Need to compensate for return value convention used by find_first_clear64.
323 //
324 size_t BitSet::find_next_clear(size_t pos) const {
325  size_t idx = block_index(pos);
326 
327  // If the block index is beyond the vector, we're done.
328  if (idx >= blocks_.size())
329  return pos + 1;
330 
331  // If the offset is not 63, set all the bits from 0 through offset and
332  // look for the first clear bit.
333  if (block_offset(pos) < 63) {
334  uint64_t temp = blocks_[idx] | ((1LL << (block_offset(pos) + 1)) - 1);
335  int bit = find_first_clear64(temp);
336  if (bit > 0)
337  return bit_position(idx, bit - 1);
338  }
339 
340  // Go through all blocks after the start block for the pos and see if
341  // there's a clear bit.
342  for (idx++; idx < blocks_.size(); idx++) {
343  int bit = find_first_clear64(blocks_[idx]);
344  if (bit > 0) {
345  return bit_position(idx, bit - 1);
346  }
347  }
348  return size();
349 }
350 
351 //
352 // Return (*this & rhs != 0).
353 //
354 bool BitSet::intersects(const BitSet &rhs) const {
355  size_t minsize = std::min(blocks_.size(), rhs.blocks_.size());
356  for (size_t idx = 0; idx < minsize; idx++) {
357  if (blocks_[idx] & rhs.blocks_[idx])
358  return true;
359  }
360  return false;
361 }
362 
363 //
364 // Return (*this == rhs).
365 //
366 // Note that it's fine to first compare the number of blocks in the vectors
367 // since we always shrink the vectors whenever possible.
368 //
369 bool BitSet::operator==(const BitSet &rhs) const {
370  if (blocks_.size() != rhs.blocks_.size())
371  return false;
372  for (size_t idx = 0; idx < blocks_.size(); idx++) {
373  if (blocks_[idx] != rhs.blocks_[idx])
374  return false;
375  }
376  return true;
377 }
378 
379 //
380 // Return (*this != rhs).
381 //
382 bool BitSet::operator!=(const BitSet &rhs) const {
383  return !operator==(rhs);
384 }
385 
386 //
387 // Return (*this & rhs).
388 //
389 BitSet BitSet::operator&(const BitSet &rhs) const {
390  BitSet temp;
391  temp.BuildIntersection(*this, rhs);
392  temp.check_invariants();
393  return temp;
394 }
395 
396 //
397 // Return (*this | rhs).
398 //
399 BitSet BitSet::operator|(const BitSet &rhs) const {
400  BitSet temp;
401  size_t minsize = std::min(blocks_.size(), rhs.blocks_.size());
402  size_t maxsize = std::max(blocks_.size(), rhs.blocks_.size());
403  temp.blocks_.resize(maxsize);
404 
405  // Process common blocks.
406  for (size_t idx = 0; idx < minsize; idx++) {
407  temp.blocks_[idx] = blocks_[idx] | rhs.blocks_[idx];
408  }
409 
410  // Process blocks that exist in LHS only. It's a noop if RHS is bigger.
411  for (size_t idx = minsize; idx < blocks_.size(); idx++) {
412  temp.blocks_[idx] = blocks_[idx];
413  }
414 
415  // Process blocks that exist in RHS only. It's a noop if LHS is bigger.
416  for (size_t idx = minsize; idx < rhs.blocks_.size(); idx++) {
417  temp.blocks_[idx] = rhs.blocks_[idx];
418  }
419 
420  temp.check_invariants();
421  return temp;
422 }
423 
424 //
425 // Implement (*this &= rhs).
426 //
427 // Note that we can't simply resize the vector to minsize since we may be
428 // able to shrink it even more depending on the values in the blocks.
429 //
431  size_t minsize = std::min(blocks_.size(), rhs.blocks_.size());
432  for (size_t idx = 0; idx < minsize; idx++) {
433  blocks_[idx] &= rhs.blocks_[idx];
434  }
435  for (size_t idx = minsize; idx < blocks_.size(); idx++) {
436  blocks_[idx] = 0;
437  }
438  compact();
439  check_invariants();
440  return *this;
441 }
442 
443 //
444 // Implement (*this |= rhs).
445 //
446 // Note that we grow the vector only once instead of doing it multiple
447 // times.
448 //
450  if (blocks_.size() < rhs.blocks_.size())
451  blocks_.resize(rhs.blocks_.size());
452  for (size_t idx = 0; idx < rhs.blocks_.size(); idx++) {
453  blocks_[idx] |= rhs.blocks_[idx];
454  }
455  check_invariants();
456  return *this;
457 }
458 
459 //
460 // Identical to operator|=.
461 //
462 void BitSet::Set(const BitSet &rhs) {
463  this->operator|=(rhs);
464  check_invariants();
465 }
466 
467 //
468 // Implement (*this &= ~rhs).
469 //
470 void BitSet::Reset(const BitSet &rhs) {
471  size_t minsize = std::min(blocks_.size(), rhs.blocks_.size());
472  for (size_t idx = 0; idx < minsize; idx++) {
473  blocks_[idx] &= ~rhs.blocks_[idx];
474  }
475  compact();
476  check_invariants();
477 }
478 
479 //
480 // Implement (*this = lhs & ~rhs).
481 //
482 // Note that we won't enter the second for loop at all if lhs is not bigger
483 // than rhs. Need to compact only for this case, but it is cheap enough to
484 // try (and do nothing) when lhs is bigger than rhs.
485 //
486 void BitSet::BuildComplement(const BitSet &lhs, const BitSet &rhs) {
487  blocks_.clear();
488  blocks_.resize(lhs.blocks_.size());
489  size_t minsize = std::min(blocks_.size(), rhs.blocks_.size());
490  for (size_t idx = 0; idx < minsize; idx++) {
491  blocks_[idx] = lhs.blocks_[idx] & ~rhs.blocks_[idx];
492  }
493  for (size_t idx = minsize; idx < lhs.blocks_.size(); idx++) {
494  blocks_[idx] = lhs.blocks_[idx];
495  }
496  compact();
497  check_invariants();
498 }
499 
500 //
501 // Implement (*this = lhs & rhs).
502 //
503 // We avoid the need to compact or to resize multiple times by building
504 // the blocks in reverse order.
505 //
506 // Note that the for loop does not handle idx 0 since the loop variable
507 // is unsigned.
508 //
509 void BitSet::BuildIntersection(const BitSet &lhs, const BitSet &rhs) {
510  blocks_.clear();
511  size_t minsize = std::min(lhs.blocks_.size(), rhs.blocks_.size());
512 
513  if (minsize == 0)
514  return;
515 
516  for (size_t idx = minsize - 1; idx > 0; idx--) {
517  if (lhs.blocks_[idx] & rhs.blocks_[idx]) {
518  if (blocks_.size() == 0)
519  blocks_.resize(idx + 1);
520  blocks_[idx] = lhs.blocks_[idx] & rhs.blocks_[idx];
521  }
522  }
523 
524  if (lhs.blocks_[0] & rhs.blocks_[0]) {
525  if (blocks_.size() == 0)
526  blocks_.resize(1);
527  blocks_[0] = lhs.blocks_[0] & rhs.blocks_[0];
528  }
529 
530  check_invariants();
531 }
532 
533 //
534 // Return true if *this contains rhs. Implemented as (rhs & ~*this != 0).
535 //
536 bool BitSet::Contains(const BitSet &rhs) const {
537  if (blocks_.size() < rhs.blocks_.size())
538  return false;
539  for (size_t idx = 0; idx < rhs.blocks_.size(); idx++) {
540  if (rhs.blocks_[idx] & ~blocks_[idx])
541  return false;
542  }
543  return true;
544 }
545 
546 //
547 // Returns string representation of the bitset. A character in the string is
548 // '1' if the corresponding bit is set, and '0' if it is not. The character
549 // position i in the string corresponds to bit position i in the bitset.
550 //
551 string BitSet::ToString() const {
552  size_t last_pos = find_last();
553  if (last_pos == BitSet::npos)
554  return string();
555 
556  string str(last_pos + 1, '0');
557  for (size_t pos = find_first(); pos != BitSet::npos; pos = find_next(pos)) {
558  str[pos] = '1';
559  }
560  return str;
561 }
562 
563 //
564 // Initialize the bitset from the provided string representation. The string
565 // must use the same format as described in ToString above. We traverse the
566 // string in reverse order to ensure that we do not have to resize multiple
567 // times.
568 //
569 // Note that the for loop does not handle str_idx 0 since the loop variable
570 // is unsigned.
571 //
572 void BitSet::FromString(string str) {
573  blocks_.clear();
574 
575  if (str.length() == 0)
576  return;
577 
578  for (size_t str_idx = str.length() - 1; str_idx > 0; str_idx--) {
579  if (str[str_idx] == '1')
580  set(str_idx);
581  }
582 
583  if (str[0] == '1')
584  set(0);
585 }
586 
587 //
588 // Returns numbered string representation of the bitset. The numbers are the
589 // bit positions that are set in the bitset. Consecutive bit positions are
590 // represented as x-y and a comma is used as a separator for non-consecutive
591 // positions.
592 //
593 string BitSet::ToNumberedString() const {
594  if (empty())
595  return "-";
596 
597  ostringstream oss;
598  bool range = false;
599  size_t last_pos = BitSet::npos;
600  for (size_t pos = find_first(); pos != BitSet::npos;
601  last_pos = pos, pos = find_next(pos)) {
602  if (last_pos == BitSet::npos) {
603  oss << integerToString(pos);
604  } else if (pos == last_pos + 1) {
605  range = true;
606  } else if (range) {
607  oss << "-" << integerToString(last_pos);
608  oss << "," << integerToString(pos);
609  range = false;
610  } else {
611  oss << "," << integerToString(pos);
612  }
613  }
614 
615  if (range)
616  oss << "-" << integerToString(last_pos);
617 
618  return oss.str();
619 }
void compact()
Definition: bitset.cc:209
void FromString(std::string str)
Definition: bitset.cc:572
bool test(size_t pos) const
Definition: bitset.cc:146
static int find_first_clear64(uint64_t value)
Definition: bitset.cc:36
BitSet & reset(size_t pos)
Definition: bitset.cc:136
std::string ToString() const
Definition: bitset.cc:551
void Reset(const BitSet &rhs)
Definition: bitset.cc:470
size_t count() const
Definition: bitset.cc:194
std::vector< uint64_t > blocks_
Definition: bitset.h:59
BitSet operator|(const BitSet &rhs) const
Definition: bitset.cc:399
void BuildIntersection(const BitSet &lhs, const BitSet &rhs)
Definition: bitset.cc:509
static int find_last_set64(uint64_t value)
Definition: bitset.cc:79
static int find_last_set32(uint32_t value)
Definition: bitset.cc:45
bool Contains(const BitSet &rhs) const
Definition: bitset.cc:536
bool empty() const
Definition: bitset.cc:165
bool operator==(const BitSet &rhs) const
Definition: bitset.cc:369
static size_t bit_position(size_t idx, size_t offset)
Definition: bitset.cc:116
size_t find_first_clear() const
Definition: bitset.cc:307
BitSet operator&(const BitSet &rhs) const
Definition: bitset.cc:389
static const std::string integerToString(const NumberType &num)
Definition: string_util.h:19
static const size_t npos
Definition: bitset.h:19
void check_invariants()
Definition: bitset.cc:232
void clear()
Definition: bitset.cc:158
size_t size() const
Definition: bitset.cc:187
bool operator==(const WaterMarkInfo &lhs, const WaterMarkInfo &rhs)
Definition: watermark.h:36
size_t find_last() const
Definition: bitset.cc:288
BitSet & operator|=(const BitSet &rhs)
Definition: bitset.cc:449
size_t find_next_clear(size_t pos) const
Definition: bitset.cc:324
void Set(const BitSet &rhs)
Definition: bitset.cc:462
Definition: bitset.h:17
BitSet & set(size_t pos)
Definition: bitset.cc:125
bool operator!=(const BitSet &rhs) const
Definition: bitset.cc:382
static int num_bits_set(uint64_t value)
Definition: bitset.cc:96
bool any() const
Definition: bitset.cc:179
static int find_first_set64(uint64_t value)
Definition: bitset.cc:22
bool none() const
Definition: bitset.cc:172
size_t find_first() const
Definition: bitset.cc:242
void BuildComplement(const BitSet &lhs, const BitSet &rhs)
Definition: bitset.cc:486
bool intersects(const BitSet &rhs) const
Definition: bitset.cc:354
size_t find_next(size_t pos) const
Definition: bitset.cc:255
std::string ToNumberedString() const
Definition: bitset.cc:593
static size_t block_offset(size_t pos)
Definition: bitset.cc:112
static size_t block_index(size_t pos)
Definition: bitset.cc:108
BitSet & operator&=(const BitSet &rhs)
Definition: bitset.cc:430