12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031 |
- /*
- A C++ header for Roaring Bitmaps.
- */
- #ifndef INCLUDE_ROARING_HH_
- #define INCLUDE_ROARING_HH_
- #include <algorithm>
- #include <cstdarg>
- #include <initializer_list>
- #include <limits>
- #include <new>
- #include <stdexcept>
- #include <string>
- #if !defined(ROARING_EXCEPTIONS)
- // __cpp_exceptions is required by C++98 and we require C++11 or better.
- #ifndef __cpp_exceptions
- #error "__cpp_exceptions should be defined"
- #endif
- #if __cpp_exceptions
- #define ROARING_EXCEPTIONS 1
- #else
- #define ROARING_EXCEPTIONS 0
- #endif
- #endif
- #ifndef ROARING_TERMINATE
- #if ROARING_EXCEPTIONS
- #define ROARING_TERMINATE(_s) throw std::runtime_error(_s)
- #else
- #define ROARING_TERMINATE(_s) std::terminate()
- #endif
- #endif
- #define ROARING_API_NOT_IN_GLOBAL_NAMESPACE // see remarks in roaring.h
- #include <roaring/roaring.h>
- #undef ROARING_API_NOT_IN_GLOBAL_NAMESPACE
- #include <roaring/roaring_array.h> // roaring::internal array functions used
- namespace roaring {
- class RoaringSetBitBiDirectionalIterator;
- /** DEPRECATED, use `RoaringSetBitBiDirectionalIterator`. */
- using RoaringSetBitForwardIterator = RoaringSetBitBiDirectionalIterator;
- /**
- * A bit of context usable with `*Bulk()` functions.
- *
- * A context may only be used with a single bitmap, and any modification to a
- * bitmap (other than modifications performed with `Bulk()` functions with the
- * context passed) will invalidate any contexts associated with that bitmap.
- */
- class BulkContext {
- public:
- friend class Roaring;
- using roaring_bitmap_bulk_context_t = api::roaring_bulk_context_t;
- BulkContext() : context_{nullptr, 0, 0, 0} {}
- BulkContext(const BulkContext &) = delete;
- BulkContext &operator=(const BulkContext &) = delete;
- BulkContext(BulkContext &&) noexcept = default;
- BulkContext &operator=(BulkContext &&) noexcept = default;
- private:
- roaring_bitmap_bulk_context_t context_;
- };
- class Roaring {
- typedef api::roaring_bitmap_t roaring_bitmap_t; // class-local name alias
- public:
- /**
- * Create an empty bitmap in the existing memory for the class.
- * The bitmap will be in the "clear" state with no auxiliary allocations.
- */
- Roaring() : roaring{} {
- // The empty constructor roaring{} silences warnings from pedantic
- // static analyzers.
- api::roaring_bitmap_init_cleared(&roaring);
- }
- /**
- * Construct a bitmap from a list of 32-bit integer values.
- */
- Roaring(size_t n, const uint32_t *data) : Roaring() {
- api::roaring_bitmap_add_many(&roaring, n, data);
- }
- /**
- * Construct a bitmap from an initializer list.
- */
- Roaring(std::initializer_list<uint32_t> l) : Roaring() {
- addMany(l.size(), l.begin());
- }
- /**
- * Construct a roaring object by taking control of a malloc()'d C struct.
- *
- * Passing a NULL pointer is unsafe.
- * The pointer to the C struct will be invalid after the call.
- */
- explicit Roaring(roaring_bitmap_t *s) noexcept : roaring(*s) {
- roaring_free(s); // deallocate the passed-in pointer
- }
- /**
- * Copy constructor.
- * It may throw std::runtime_error if there is insufficient memory.
- */
- Roaring(const Roaring &r) : Roaring() {
- if (!api::roaring_bitmap_overwrite(&roaring, &r.roaring)) {
- ROARING_TERMINATE("failed roaring_bitmap_overwrite in constructor");
- }
- api::roaring_bitmap_set_copy_on_write(
- &roaring, api::roaring_bitmap_get_copy_on_write(&r.roaring));
- }
- /**
- * Move constructor. The moved-from object remains valid but empty, i.e.
- * it behaves as though it was just freshly constructed.
- */
- Roaring(Roaring &&r) noexcept : roaring(r.roaring) {
- //
- // !!! This clones the bits of the roaring structure to a new location
- // and then overwrites the old bits...assuming that this will still
- // work. There are scenarios where this could break; e.g. if some of
- // those bits were pointers into the structure memory itself. If such
- // things were possible, a roaring_bitmap_move() API would be needed.
- //
- api::roaring_bitmap_init_cleared(&r.roaring);
- }
- /**
- * Construct a bitmap from a list of uint32_t values.
- */
- static Roaring bitmapOf(size_t n, ...) {
- Roaring ans;
- va_list vl;
- va_start(vl, n);
- for (size_t i = 0; i < n; i++) {
- ans.add(va_arg(vl, uint32_t));
- }
- va_end(vl);
- return ans;
- }
- /**
- * Copies the content of the provided bitmap, and
- * discard the current content.
- * It may throw std::runtime_error if there is insufficient memory.
- */
- Roaring &operator=(const Roaring &r) {
- if (!api::roaring_bitmap_overwrite(&roaring, &r.roaring)) {
- ROARING_TERMINATE("failed memory alloc in assignment");
- }
- api::roaring_bitmap_set_copy_on_write(
- &roaring, api::roaring_bitmap_get_copy_on_write(&r.roaring));
- return *this;
- }
- /**
- * Moves the content of the provided bitmap, and
- * discard the current content.
- */
- Roaring &operator=(Roaring &&r) noexcept {
- api::roaring_bitmap_clear(&roaring); // free this class's allocations
- // !!! See notes in the Move Constructor regarding roaring_bitmap_move()
- //
- roaring = r.roaring;
- api::roaring_bitmap_init_cleared(&r.roaring);
- return *this;
- }
- /**
- * Assignment from an initializer list.
- */
- Roaring &operator=(std::initializer_list<uint32_t> l) {
- // Delegate to move assignment operator
- *this = Roaring(l);
- return *this;
- }
- /**
- * Construct a bitmap from a list of uint32_t values.
- * E.g., bitmapOfList({1,2,3}).
- */
- static Roaring bitmapOfList(std::initializer_list<uint32_t> l) {
- Roaring ans;
- ans.addMany(l.size(), l.begin());
- return ans;
- }
- /**
- * Add value x
- */
- void add(uint32_t x) noexcept { api::roaring_bitmap_add(&roaring, x); }
- /**
- * Add value x
- * Returns true if a new value was added, false if the value was already
- * existing.
- */
- bool addChecked(uint32_t x) noexcept {
- return api::roaring_bitmap_add_checked(&roaring, x);
- }
- /**
- * Add all values in range [min, max)
- */
- void addRange(const uint64_t min, const uint64_t max) noexcept {
- return api::roaring_bitmap_add_range(&roaring, min, max);
- }
- /**
- * Add all values in range [min, max]
- */
- void addRangeClosed(const uint32_t min, const uint32_t max) noexcept {
- return api::roaring_bitmap_add_range_closed(&roaring, min, max);
- }
- /**
- * Add value n_args from pointer vals
- */
- void addMany(size_t n_args, const uint32_t *vals) noexcept {
- api::roaring_bitmap_add_many(&roaring, n_args, vals);
- }
- /**
- * Add value val, using context from a previous insert for speed
- * optimization.
- *
- * `context` will be used to store information between calls to make bulk
- * operations faster. `context` should be default-initialized before the
- * first call to this function.
- */
- void addBulk(BulkContext &context, uint32_t x) noexcept {
- api::roaring_bitmap_add_bulk(&roaring, &context.context_, x);
- }
- /**
- * Check if item x is present, using context from a previous insert or
- * search for speed optimization.
- *
- * `context` will be used to store information between calls to make bulk
- * operations faster. `context` should be default-initialized before the
- * first call to this function.
- */
- bool containsBulk(BulkContext &context, uint32_t x) const noexcept {
- return api::roaring_bitmap_contains_bulk(&roaring, &context.context_,
- x);
- }
- /**
- * Remove value x
- */
- void remove(uint32_t x) noexcept {
- api::roaring_bitmap_remove(&roaring, x);
- }
- /**
- * Remove value x
- * Returns true if a new value was removed, false if the value was not
- * existing.
- */
- bool removeChecked(uint32_t x) noexcept {
- return api::roaring_bitmap_remove_checked(&roaring, x);
- }
- /**
- * Remove all values in range [min, max)
- */
- void removeRange(uint64_t min, uint64_t max) noexcept {
- return api::roaring_bitmap_remove_range(&roaring, min, max);
- }
- /**
- * Remove all values in range [min, max]
- */
- void removeRangeClosed(uint32_t min, uint32_t max) noexcept {
- return api::roaring_bitmap_remove_range_closed(&roaring, min, max);
- }
- /**
- * Clears the bitmap.
- */
- void clear() { api::roaring_bitmap_clear(&roaring); }
- /**
- * Return the largest value (if not empty)
- */
- uint32_t maximum() const noexcept {
- return api::roaring_bitmap_maximum(&roaring);
- }
- /**
- * Return the smallest value (if not empty)
- */
- uint32_t minimum() const noexcept {
- return api::roaring_bitmap_minimum(&roaring);
- }
- /**
- * Check if value x is present
- */
- bool contains(uint32_t x) const noexcept {
- return api::roaring_bitmap_contains(&roaring, x);
- }
- /**
- * Check if all values from x (included) to y (excluded) are present
- */
- bool containsRange(const uint64_t x, const uint64_t y) const noexcept {
- return api::roaring_bitmap_contains_range(&roaring, x, y);
- }
- bool containsRangeClosed(const uint32_t x,
- const uint32_t y) const noexcept {
- return api::roaring_bitmap_contains_range_closed(&roaring, x, y);
- }
- /**
- * Compute the intersection between the current bitmap and the provided
- * bitmap, writing the result in the current bitmap. The provided bitmap
- * is not modified.
- *
- * Performance hint: if you are computing the intersection between several
- * bitmaps, two-by-two, it is best to start with the smallest bitmap.
- */
- Roaring &operator&=(const Roaring &r) noexcept {
- api::roaring_bitmap_and_inplace(&roaring, &r.roaring);
- return *this;
- }
- /**
- * Compute the difference between the current bitmap and the provided
- * bitmap, writing the result in the current bitmap. The provided bitmap
- * is not modified.
- */
- Roaring &operator-=(const Roaring &r) noexcept {
- api::roaring_bitmap_andnot_inplace(&roaring, &r.roaring);
- return *this;
- }
- /**
- * Compute the union between the current bitmap and the provided bitmap,
- * writing the result in the current bitmap. The provided bitmap is not
- * modified.
- *
- * See also the fastunion function to aggregate many bitmaps more quickly.
- */
- Roaring &operator|=(const Roaring &r) noexcept {
- api::roaring_bitmap_or_inplace(&roaring, &r.roaring);
- return *this;
- }
- /**
- * Compute the symmetric union between the current bitmap and the provided
- * bitmap, writing the result in the current bitmap. The provided bitmap
- * is not modified.
- */
- Roaring &operator^=(const Roaring &r) noexcept {
- api::roaring_bitmap_xor_inplace(&roaring, &r.roaring);
- return *this;
- }
- /**
- * Exchange the content of this bitmap with another.
- */
- void swap(Roaring &r) noexcept { std::swap(r.roaring, roaring); }
- /**
- * Get the cardinality of the bitmap (number of elements).
- */
- uint64_t cardinality() const noexcept {
- return api::roaring_bitmap_get_cardinality(&roaring);
- }
- /**
- * Returns true if the bitmap is empty (cardinality is zero).
- */
- bool isEmpty() const noexcept {
- return api::roaring_bitmap_is_empty(&roaring);
- }
- /**
- * Returns true if the bitmap is full (cardinality is uint32_t max + 1).
- * we put std::numeric_limits<>::max/min in parentheses
- * to avoid a clash with the Windows.h header under Windows.
- */
- bool isFull() const noexcept {
- return api::roaring_bitmap_get_cardinality(&roaring) ==
- ((uint64_t)(std::numeric_limits<uint32_t>::max)()) + 1;
- }
- /**
- * Returns true if the bitmap is subset of the other.
- */
- bool isSubset(const Roaring &r) const noexcept {
- return api::roaring_bitmap_is_subset(&roaring, &r.roaring);
- }
- /**
- * Returns true if the bitmap is strict subset of the other.
- */
- bool isStrictSubset(const Roaring &r) const noexcept {
- return api::roaring_bitmap_is_strict_subset(&roaring, &r.roaring);
- }
- /**
- * Convert the bitmap to an array. Write the output to "ans", caller is
- * responsible to ensure that there is enough memory allocated
- * (e.g., ans = new uint32[mybitmap.cardinality()];)
- */
- void toUint32Array(uint32_t *ans) const noexcept {
- api::roaring_bitmap_to_uint32_array(&roaring, ans);
- }
- /**
- * To int array with pagination
- */
- void rangeUint32Array(uint32_t *ans, size_t offset,
- size_t limit) const noexcept {
- api::roaring_bitmap_range_uint32_array(&roaring, offset, limit, ans);
- }
- /**
- * Return true if the two bitmaps contain the same elements.
- */
- bool operator==(const Roaring &r) const noexcept {
- return api::roaring_bitmap_equals(&roaring, &r.roaring);
- }
- /**
- * Compute the negation of the roaring bitmap within the half-open interval
- * [range_start, range_end). Areas outside the interval are unchanged.
- */
- void flip(uint64_t range_start, uint64_t range_end) noexcept {
- api::roaring_bitmap_flip_inplace(&roaring, range_start, range_end);
- }
- /**
- * Compute the negation of the roaring bitmap within the closed interval
- * [range_start, range_end]. Areas outside the interval are unchanged.
- */
- void flipClosed(uint32_t range_start, uint32_t range_end) noexcept {
- api::roaring_bitmap_flip_inplace_closed(&roaring, range_start,
- range_end);
- }
- /**
- * Remove run-length encoding even when it is more space efficient.
- * Return whether a change was applied.
- */
- bool removeRunCompression() noexcept {
- return api::roaring_bitmap_remove_run_compression(&roaring);
- }
- /**
- * Convert array and bitmap containers to run containers when it is more
- * efficient; also convert from run containers when more space efficient.
- * Returns true if the result has at least one run container. Additional
- * savings might be possible by calling shrinkToFit().
- */
- bool runOptimize() noexcept {
- return api::roaring_bitmap_run_optimize(&roaring);
- }
- /**
- * If needed, reallocate memory to shrink the memory usage. Returns
- * the number of bytes saved.
- */
- size_t shrinkToFit() noexcept {
- return api::roaring_bitmap_shrink_to_fit(&roaring);
- }
- /**
- * Iterate over the bitmap elements. The function iterator is called once
- * for all the values with ptr (can be NULL) as the second parameter of
- * each call.
- *
- * roaring_iterator is simply a pointer to a function that returns bool
- * (true means that the iteration should continue while false means that it
- * should stop), and takes (uint32_t,void*) as inputs.
- */
- void iterate(api::roaring_iterator iterator, void *ptr) const {
- api::roaring_iterate(&roaring, iterator, ptr);
- }
- /**
- * Selects the value at index rnk in the bitmap, where the smallest value
- * is at index 0.
- *
- * If the size of the roaring bitmap is strictly greater than rank, then
- * this function returns true and sets element to the element of given rank.
- * Otherwise, it returns false.
- */
- bool select(uint32_t rnk, uint32_t *element) const noexcept {
- return api::roaring_bitmap_select(&roaring, rnk, element);
- }
- /**
- * Computes the size of the intersection between two bitmaps.
- */
- uint64_t and_cardinality(const Roaring &r) const noexcept {
- return api::roaring_bitmap_and_cardinality(&roaring, &r.roaring);
- }
- /**
- * Check whether the two bitmaps intersect.
- */
- bool intersect(const Roaring &r) const noexcept {
- return api::roaring_bitmap_intersect(&roaring, &r.roaring);
- }
- /**
- * Computes the Jaccard index between two bitmaps. (Also known as the
- * Tanimoto distance,
- * or the Jaccard similarity coefficient)
- *
- * The Jaccard index is undefined if both bitmaps are empty.
- */
- double jaccard_index(const Roaring &r) const noexcept {
- return api::roaring_bitmap_jaccard_index(&roaring, &r.roaring);
- }
- /**
- * Computes the size of the union between two bitmaps.
- */
- uint64_t or_cardinality(const Roaring &r) const noexcept {
- return api::roaring_bitmap_or_cardinality(&roaring, &r.roaring);
- }
- /**
- * Computes the size of the difference (andnot) between two bitmaps.
- */
- uint64_t andnot_cardinality(const Roaring &r) const noexcept {
- return api::roaring_bitmap_andnot_cardinality(&roaring, &r.roaring);
- }
- /**
- * Computes the size of the symmetric difference (andnot) between two
- * bitmaps.
- */
- uint64_t xor_cardinality(const Roaring &r) const noexcept {
- return api::roaring_bitmap_xor_cardinality(&roaring, &r.roaring);
- }
- /**
- * Returns the number of integers that are smaller or equal to x.
- * Thus the rank of the smallest element is one. If
- * x is smaller than the smallest element, this function will return 0.
- * The rank and select functions differ in convention: this function returns
- * 1 when ranking the smallest value, but the select function returns the
- * smallest value when using index 0.
- */
- uint64_t rank(uint32_t x) const noexcept {
- return api::roaring_bitmap_rank(&roaring, x);
- }
- /**
- * Get `rank()` values in bulk. The values in `[begin .. end)` must be in
- * Ascending order. possible implementation: for(auto* iter = begin; iter !=
- * end; ++iter) *(ans++) = rank(*iter);
- */
- void rank_many(const uint32_t *begin, const uint32_t *end,
- uint64_t *ans) const noexcept {
- return api::roaring_bitmap_rank_many(&roaring, begin, end, ans);
- }
- /**
- * Returns the index of x in the set, index start from 0.
- * If the set doesn't contain x , this function will return -1.
- * The difference with rank function is that this function will return -1
- * when x isn't in the set, but the rank function will return a
- * non-negative number.
- */
- int64_t getIndex(uint32_t x) const noexcept {
- return api::roaring_bitmap_get_index(&roaring, x);
- }
- /**
- * Write a bitmap to a char buffer. This is meant to be compatible with
- * the Java and Go versions. Returns how many bytes were written which
- * should be getSizeInBytes().
- *
- * Setting the portable flag to false enable a custom format that
- * can save space compared to the portable format (e.g., for very
- * sparse bitmaps).
- *
- * Boost users can serialize bitmaps in this manner:
- *
- * BOOST_SERIALIZATION_SPLIT_FREE(Roaring)
- * namespace boost {
- * namespace serialization {
- *
- * template <class Archive>
- * void save(Archive& ar, const Roaring& bitmask,
- * const unsigned int version) {
- * std::size_t expected_size_in_bytes = bitmask.getSizeInBytes();
- * std::vector<char> buffer(expected_size_in_bytes);
- * std::size_t size_in_bytes = bitmask.write(buffer.data());
- *
- * ar& size_in_bytes;
- * ar& boost::serialization::make_binary_object(buffer.data(),
- * size_in_bytes);
- * }
- * template <class Archive>
- * void load(Archive& ar, Roaring& bitmask,
- * const unsigned int version) {
- * std::size_t size_in_bytes = 0;
- * ar& size_in_bytes;
- * std::vector<char> buffer(size_in_bytes);
- * ar& boost::serialization::make_binary_object(buffer.data(),
- * size_in_bytes);
- * bitmask = Roaring::readSafe(buffer.data(), size_in_bytes);
- * }
- * } // namespace serialization
- * } // namespace boost
- */
- size_t write(char *buf, bool portable = true) const noexcept {
- if (portable) {
- return api::roaring_bitmap_portable_serialize(&roaring, buf);
- } else {
- return api::roaring_bitmap_serialize(&roaring, buf);
- }
- }
- /**
- * Read a bitmap from a serialized version. This is meant to be compatible
- * with the Java and Go versions.
- *
- * Setting the portable flag to false enable a custom format that
- * can save space compared to the portable format (e.g., for very
- * sparse bitmaps).
- *
- * This function is unsafe in the sense that if you provide bad data,
- * many, many bytes could be read. See also readSafe.
- *
- * The function may throw std::runtime_error if a bitmap could not be read.
- * Not that even if it does not throw, the bitmap could still be unusable if
- * the loaded data does not match the portable Roaring specification: you
- * should ensure that the data you load come from a serialized bitmap.
- */
- static Roaring read(const char *buf, bool portable = true) {
- roaring_bitmap_t *r =
- portable ? api::roaring_bitmap_portable_deserialize(buf)
- : api::roaring_bitmap_deserialize(buf);
- if (r == NULL) {
- ROARING_TERMINATE("failed alloc while reading");
- }
- return Roaring(r);
- }
- /**
- * Read a bitmap from a serialized version, reading no more than maxbytes
- * bytes. This is meant to be compatible with the Java and Go versions.
- * The function itself is safe in the sense that it will not cause buffer
- * overflows. However, for correct operations, it is assumed that the bitmap
- * read was once serialized from a valid bitmap. If you provided an
- * incorrect input (garbage), then the bitmap read may not be in a valid
- * state and following operations may not lead to sensible results. It is
- * your responsability to ensure that the input bytes follow the format
- * specification if you want a usable bitmap:
- * https://github.com/RoaringBitmap/RoaringFormatSpec
- * In particular, the serialized array containers need to be in sorted
- * order, and the run containers should be in sorted non-overlapping order.
- * This is is guaranteed to happen when serializing an existing bitmap, but
- * not for random inputs. Note that this function assumes that your bitmap
- * was serialized in *portable* mode (which is the default with the 'write'
- * method).
- *
- * The function may throw std::runtime_error if a bitmap could not be read.
- * Not that even if it does not throw, the bitmap could still be unusable if
- * the loaded data does not match the portable Roaring specification: you
- * should ensure that the data you load come from a serialized bitmap.
- */
- static Roaring readSafe(const char *buf, size_t maxbytes) {
- roaring_bitmap_t *r =
- api::roaring_bitmap_portable_deserialize_safe(buf, maxbytes);
- if (r == NULL) {
- ROARING_TERMINATE("failed alloc while reading");
- }
- return Roaring(r);
- }
- /**
- * How many bytes are required to serialize this bitmap (meant to be
- * compatible with Java and Go versions)
- *
- * Setting the portable flag to false enable a custom format that
- * can save space compared to the portable format (e.g., for very
- * sparse bitmaps).
- */
- size_t getSizeInBytes(bool portable = true) const noexcept {
- if (portable) {
- return api::roaring_bitmap_portable_size_in_bytes(&roaring);
- } else {
- return api::roaring_bitmap_size_in_bytes(&roaring);
- }
- }
- /**
- * For advanced users.
- * This function may throw std::runtime_error.
- */
- static const Roaring frozenView(const char *buf, size_t length) {
- const roaring_bitmap_t *s =
- api::roaring_bitmap_frozen_view(buf, length);
- if (s == NULL) {
- ROARING_TERMINATE("failed to read frozen bitmap");
- }
- Roaring r;
- r.roaring = *s;
- return r;
- }
- /**
- * For advanced users; see roaring_bitmap_portable_deserialize_frozen.
- * This function may throw std::runtime_error.
- */
- static const Roaring portableDeserializeFrozen(const char *buf) {
- const roaring_bitmap_t *s =
- api::roaring_bitmap_portable_deserialize_frozen(buf);
- if (s == NULL) {
- ROARING_TERMINATE("failed to read portable frozen bitmap");
- }
- Roaring r;
- r.roaring = *s;
- return r;
- }
- /**
- * For advanced users.
- */
- void writeFrozen(char *buf) const noexcept {
- roaring_bitmap_frozen_serialize(&roaring, buf);
- }
- /**
- * For advanced users.
- */
- size_t getFrozenSizeInBytes() const noexcept {
- return roaring_bitmap_frozen_size_in_bytes(&roaring);
- }
- /**
- * Computes the intersection between two bitmaps and returns new bitmap.
- * The current bitmap and the provided bitmap are unchanged.
- *
- * Performance hint: if you are computing the intersection between several
- * bitmaps, two-by-two, it is best to start with the smallest bitmap.
- * Consider also using the operator &= to avoid needlessly creating
- * many temporary bitmaps.
- * This function may throw std::runtime_error.
- */
- Roaring operator&(const Roaring &o) const {
- roaring_bitmap_t *r = api::roaring_bitmap_and(&roaring, &o.roaring);
- if (r == NULL) {
- ROARING_TERMINATE("failed materalization in and");
- }
- return Roaring(r);
- }
- /**
- * Computes the difference between two bitmaps and returns new bitmap.
- * The current bitmap and the provided bitmap are unchanged.
- * This function may throw std::runtime_error.
- */
- Roaring operator-(const Roaring &o) const {
- roaring_bitmap_t *r = api::roaring_bitmap_andnot(&roaring, &o.roaring);
- if (r == NULL) {
- ROARING_TERMINATE("failed materalization in andnot");
- }
- return Roaring(r);
- }
- /**
- * Computes the union between two bitmaps and returns new bitmap.
- * The current bitmap and the provided bitmap are unchanged.
- * This function may throw std::runtime_error.
- */
- Roaring operator|(const Roaring &o) const {
- roaring_bitmap_t *r = api::roaring_bitmap_or(&roaring, &o.roaring);
- if (r == NULL) {
- ROARING_TERMINATE("failed materalization in or");
- }
- return Roaring(r);
- }
- /**
- * Computes the symmetric union between two bitmaps and returns new bitmap.
- * The current bitmap and the provided bitmap are unchanged.
- * This function may throw std::runtime_error.
- */
- Roaring operator^(const Roaring &o) const {
- roaring_bitmap_t *r = api::roaring_bitmap_xor(&roaring, &o.roaring);
- if (r == NULL) {
- ROARING_TERMINATE("failed materalization in xor");
- }
- return Roaring(r);
- }
- /**
- * Whether or not we apply copy and write.
- */
- void setCopyOnWrite(bool val) noexcept {
- api::roaring_bitmap_set_copy_on_write(&roaring, val);
- }
- /**
- * Print the content of the bitmap
- */
- void printf() const noexcept { api::roaring_bitmap_printf(&roaring); }
- /**
- * Print the content of the bitmap into a string
- */
- std::string toString() const noexcept {
- struct iter_data {
- std::string str{}; // The empty constructor silences warnings from
- // pedantic static analyzers.
- char first_char = '{';
- } outer_iter_data;
- if (!isEmpty()) {
- iterate(
- [](uint32_t value, void *inner_iter_data) -> bool {
- ((iter_data *)inner_iter_data)->str +=
- ((iter_data *)inner_iter_data)->first_char;
- ((iter_data *)inner_iter_data)->str +=
- std::to_string(value);
- ((iter_data *)inner_iter_data)->first_char = ',';
- return true;
- },
- (void *)&outer_iter_data);
- } else
- outer_iter_data.str = '{';
- outer_iter_data.str += '}';
- return outer_iter_data.str;
- }
- /**
- * Whether or not copy and write is active.
- */
- bool getCopyOnWrite() const noexcept {
- return api::roaring_bitmap_get_copy_on_write(&roaring);
- }
- /**
- * Computes the logical or (union) between "n" bitmaps (referenced by a
- * pointer).
- * This function may throw std::runtime_error.
- */
- static Roaring fastunion(size_t n, const Roaring **inputs) {
- const roaring_bitmap_t **x = (const roaring_bitmap_t **)roaring_malloc(
- n * sizeof(roaring_bitmap_t *));
- if (x == NULL) {
- ROARING_TERMINATE("failed memory alloc in fastunion");
- }
- for (size_t k = 0; k < n; ++k) x[k] = &inputs[k]->roaring;
- roaring_bitmap_t *c_ans = api::roaring_bitmap_or_many(n, x);
- if (c_ans == NULL) {
- roaring_free(x);
- ROARING_TERMINATE("failed memory alloc in fastunion");
- }
- Roaring ans(c_ans);
- roaring_free(x);
- return ans;
- }
- /**
- * Destructor. By contract, calling roaring_bitmap_clear() is enough to
- * release all auxiliary memory used by the structure.
- */
- ~Roaring() {
- if (!(roaring.high_low_container.flags & ROARING_FLAG_FROZEN)) {
- api::roaring_bitmap_clear(&roaring);
- } else {
- // The roaring member variable copies the `roaring_bitmap_t` and
- // nested `roaring_array_t` structures by value and is freed in the
- // constructor, however the underlying memory arena used for the
- // container data is not freed with it. Here we derive the arena
- // pointer from the second arena allocation in
- // `roaring_bitmap_frozen_view` and free it as well.
- roaring_bitmap_free(
- (roaring_bitmap_t *)((char *)
- roaring.high_low_container.containers -
- sizeof(roaring_bitmap_t)));
- }
- }
- friend class RoaringSetBitBiDirectionalIterator;
- typedef RoaringSetBitBiDirectionalIterator const_iterator;
- typedef RoaringSetBitBiDirectionalIterator const_bidirectional_iterator;
- /**
- * Returns an iterator that can be used to access the position of the set
- * bits. The running time complexity of a full scan is proportional to the
- * number of set bits: be aware that if you have long strings of 1s, this
- * can be very inefficient.
- *
- * It can be much faster to use the toArray method if you want to retrieve
- * the set bits.
- */
- const_iterator begin() const;
- /**
- * A bogus iterator that can be used together with begin()
- * for constructions such as for (auto i = b.begin(); * i!=b.end(); ++i) {}
- */
- const_iterator &end() const;
- roaring_bitmap_t roaring;
- };
- /**
- * Used to go through the set bits. Not optimally fast, but convenient.
- */
- class RoaringSetBitBiDirectionalIterator final {
- public:
- typedef std::bidirectional_iterator_tag iterator_category;
- typedef uint32_t *pointer;
- typedef uint32_t &reference_type;
- typedef uint32_t value_type;
- typedef int32_t difference_type;
- typedef RoaringSetBitBiDirectionalIterator type_of_iterator;
- explicit RoaringSetBitBiDirectionalIterator(const Roaring &parent,
- bool exhausted = false) {
- if (exhausted) {
- i.parent = &parent.roaring;
- i.container_index = INT32_MAX;
- i.has_value = false;
- i.current_value = UINT32_MAX;
- } else {
- api::roaring_iterator_init(&parent.roaring, &i);
- }
- }
- /**
- * Provides the location of the set bit.
- */
- value_type operator*() const { return i.current_value; }
- bool operator<(const type_of_iterator &o) const {
- if (!i.has_value) return false;
- if (!o.i.has_value) return true;
- return i.current_value < *o;
- }
- bool operator<=(const type_of_iterator &o) const {
- if (!o.i.has_value) return true;
- if (!i.has_value) return false;
- return i.current_value <= *o;
- }
- bool operator>(const type_of_iterator &o) const {
- if (!o.i.has_value) return false;
- if (!i.has_value) return true;
- return i.current_value > *o;
- }
- bool operator>=(const type_of_iterator &o) const {
- if (!i.has_value) return true;
- if (!o.i.has_value) return false;
- return i.current_value >= *o;
- }
- type_of_iterator &operator++() { // ++i, must returned inc. value
- api::roaring_uint32_iterator_advance(&i);
- return *this;
- }
- type_of_iterator operator++(int) { // i++, must return orig. value
- RoaringSetBitBiDirectionalIterator orig(*this);
- api::roaring_uint32_iterator_advance(&i);
- return orig;
- }
- /**
- * Move the iterator to the first value >= val.
- * Return true if there is such a value.
- */
- bool move_equalorlarger(value_type val) {
- return api::roaring_uint32_iterator_move_equalorlarger(&i, val);
- }
- /** DEPRECATED, use `move_equalorlarger`.*/
- CROARING_DEPRECATED void equalorlarger(uint32_t val) {
- api::roaring_uint32_iterator_move_equalorlarger(&i, val);
- }
- type_of_iterator &operator--() { // prefix --
- api::roaring_uint32_iterator_previous(&i);
- return *this;
- }
- type_of_iterator operator--(int) { // postfix --
- RoaringSetBitBiDirectionalIterator orig(*this);
- api::roaring_uint32_iterator_previous(&i);
- return orig;
- }
- bool operator==(const RoaringSetBitBiDirectionalIterator &o) const {
- return i.current_value == *o && i.has_value == o.i.has_value;
- }
- bool operator!=(const RoaringSetBitBiDirectionalIterator &o) const {
- return i.current_value != *o || i.has_value != o.i.has_value;
- }
- api::roaring_uint32_iterator_t
- i{}; // The empty constructor silences warnings from pedantic static
- // analyzers.
- };
- inline RoaringSetBitBiDirectionalIterator Roaring::begin() const {
- return RoaringSetBitBiDirectionalIterator(*this);
- }
- inline RoaringSetBitBiDirectionalIterator &Roaring::end() const {
- static RoaringSetBitBiDirectionalIterator e(*this, true);
- return e;
- }
- } // namespace roaring
- #endif /* INCLUDE_ROARING_HH_ */
|