diff --git a/Cargo.lock b/Cargo.lock index b84ae4d..4f45afa 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -176,7 +176,7 @@ dependencies = [ [[package]] name = "croaring" -version = "2.0.0" +version = "2.0.1" dependencies = [ "criterion", "croaring-sys", diff --git a/croaring-sys/CRoaring/bindgen_bundled_version.rs b/croaring-sys/CRoaring/bindgen_bundled_version.rs index 2cb2d5b..d8da1ef 100644 --- a/croaring-sys/CRoaring/bindgen_bundled_version.rs +++ b/croaring-sys/CRoaring/bindgen_bundled_version.rs @@ -1,9 +1,9 @@ /* automatically generated by rust-bindgen 0.69.4 */ -pub const ROARING_VERSION: &[u8; 6] = b"3.0.1\0"; -pub const ROARING_VERSION_MAJOR: _bindgen_ty_1 = 3; +pub const ROARING_VERSION: &[u8; 6] = b"4.0.0\0"; +pub const ROARING_VERSION_MAJOR: _bindgen_ty_1 = 4; pub const ROARING_VERSION_MINOR: _bindgen_ty_1 = 0; -pub const ROARING_VERSION_REVISION: _bindgen_ty_1 = 1; +pub const ROARING_VERSION_REVISION: _bindgen_ty_1 = 0; pub type _bindgen_ty_1 = ::core::ffi::c_uint; #[doc = " Roaring arrays are array-based key-value pairs having containers as values\n and 16-bit integer keys. A roaring bitmap might be implemented as such."] #[repr(C)] @@ -45,6 +45,26 @@ pub struct roaring_statistics_s { } #[doc = " (For advanced users.)\n The roaring_statistics_t can be used to collect detailed statistics about\n the composition of a roaring bitmap."] pub type roaring_statistics_t = roaring_statistics_s; +#[doc = " (For advanced users.)\n The roaring64_statistics_t can be used to collect detailed statistics about\n the composition of a roaring64 bitmap."] +#[repr(C)] +#[derive(Debug, Copy, Clone)] +pub struct roaring64_statistics_s { + pub n_containers: u64, + pub n_array_containers: u64, + pub n_run_containers: u64, + pub n_bitset_containers: u64, + pub n_values_array_containers: u64, + pub n_values_run_containers: u64, + pub n_values_bitset_containers: u64, + pub n_bytes_array_containers: u64, + pub n_bytes_run_containers: u64, + pub n_bytes_bitset_containers: u64, + pub max_value: u64, + pub min_value: u64, + pub cardinality: u64, +} +#[doc = " (For advanced users.)\n The roaring64_statistics_t can be used to collect detailed statistics about\n the composition of a roaring64 bitmap."] +pub type roaring64_statistics_t = roaring64_statistics_s; #[doc = " Roaring-internal type used to iterate within a roaring container."] #[repr(C)] #[derive(Debug, Copy, Clone)] @@ -973,6 +993,13 @@ extern "C" { #[doc = " Returns true if the result has at least one run container."] pub fn roaring64_bitmap_run_optimize(r: *mut roaring64_bitmap_t) -> bool; } +extern "C" { + #[doc = " (For advanced users.)\n Collect statistics about the bitmap"] + pub fn roaring64_bitmap_statistics( + r: *const roaring64_bitmap_t, + stat: *mut roaring64_statistics_t, + ); +} extern "C" { #[doc = " Perform internal consistency checks.\n\n Returns true if the bitmap is consistent. It may be useful to call this\n after deserializing bitmaps from untrusted sources. If\n roaring64_bitmap_internal_validate returns true, then the bitmap is\n consistent and can be trusted not to cause crashes or memory corruption.\n\n If reason is non-null, it will be set to a string describing the first\n inconsistency found if any."] pub fn roaring64_bitmap_internal_validate( diff --git a/croaring-sys/CRoaring/roaring.c b/croaring-sys/CRoaring/roaring.c index 7385cff..6c6f58d 100644 --- a/croaring-sys/CRoaring/roaring.c +++ b/croaring-sys/CRoaring/roaring.c @@ -1,5 +1,5 @@ // !!! DO NOT EDIT - THIS IS AN AUTO-GENERATED FILE !!! -// Created by amalgamation.sh on 2024-04-02T13:42:32Z +// Created by amalgamation.sh on 2024-05-13T21:29:25Z /* * The CRoaring project is under a dual license (Apache/MIT). @@ -10141,7 +10141,7 @@ static art_indexed_child_t art_node_next_child(const art_node_t *node, return art_node256_next_child((art_node256_t *)node, index); default: assert(false); - return (art_indexed_child_t){0}; + return (art_indexed_child_t){0, 0, 0}; } } @@ -10165,7 +10165,7 @@ static art_indexed_child_t art_node_prev_child(const art_node_t *node, return art_node256_prev_child((art_node256_t *)node, index); default: assert(false); - return (art_indexed_child_t){0}; + return (art_indexed_child_t){0, 0, 0}; } } @@ -10189,7 +10189,7 @@ static art_indexed_child_t art_node_child_at(const art_node_t *node, return art_node256_child_at((art_node256_t *)node, index); default: assert(false); - return (art_indexed_child_t){0}; + return (art_indexed_child_t){0, 0, 0}; } } @@ -10213,7 +10213,7 @@ static art_indexed_child_t art_node_lower_bound(const art_node_t *node, return art_node256_lower_bound((art_node256_t *)node, key_chunk); default: assert(false); - return (art_indexed_child_t){0}; + return (art_indexed_child_t){0, 0, 0}; } } @@ -10770,7 +10770,7 @@ static bool art_node_iterator_lower_bound(const art_node_t *node, } art_iterator_t art_init_iterator(const art_t *art, bool first) { - art_iterator_t iterator = {0}; + art_iterator_t iterator = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}; if (art->root == NULL) { return iterator; } @@ -10827,7 +10827,7 @@ bool art_iterator_lower_bound(art_iterator_t *iterator, } art_iterator_t art_lower_bound(const art_t *art, const art_key_chunk_t *key) { - art_iterator_t iterator = {0}; + art_iterator_t iterator = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}; if (art->root != NULL) { art_node_iterator_lower_bound(art->root, &iterator, key); } @@ -10835,7 +10835,7 @@ art_iterator_t art_lower_bound(const art_t *art, const art_key_chunk_t *key) { } art_iterator_t art_upper_bound(const art_t *art, const art_key_chunk_t *key) { - art_iterator_t iterator = {0}; + art_iterator_t iterator = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}; if (art->root != NULL) { if (art_node_iterator_lower_bound(art->root, &iterator, key) && art_compare_keys(iterator.key, key) == 0) { @@ -19469,7 +19469,7 @@ roaring_bitmap_t *roaring_bitmap_of(size_t n_args, ...) { // todo: could be greatly optimized but we do not expect this call to ever // include long lists roaring_bitmap_t *answer = roaring_bitmap_create(); - roaring_bulk_context_t context = {0}; + roaring_bulk_context_t context = {0, 0, 0, 0}; va_list ap; va_start(ap, n_args); for (size_t i = 0; i < n_args; i++) { @@ -19641,20 +19641,6 @@ void roaring_bitmap_printf_describe(const roaring_bitmap_t *r) { printf("}"); } -typedef struct min_max_sum_s { - uint32_t min; - uint32_t max; - uint64_t sum; -} min_max_sum_t; - -static bool min_max_sum_fnc(uint32_t value, void *param) { - min_max_sum_t *mms = (min_max_sum_t *)param; - if (value > mms->max) mms->max = value; - if (value < mms->min) mms->min = value; - mms->sum += value; - return true; // we always process all data points -} - /** * (For advanced users.) * Collect statistics about the bitmap @@ -19665,15 +19651,8 @@ void roaring_bitmap_statistics(const roaring_bitmap_t *r, memset(stat, 0, sizeof(*stat)); stat->n_containers = ra->size; - stat->cardinality = roaring_bitmap_get_cardinality(r); - min_max_sum_t mms; - mms.min = UINT32_C(0xFFFFFFFF); - mms.max = UINT32_C(0); - mms.sum = 0; - roaring_iterate(r, &min_max_sum_fnc, &mms); - stat->min_value = mms.min; - stat->max_value = mms.max; - stat->sum_value = mms.sum; + stat->min_value = roaring_bitmap_minimum(r); + stat->max_value = roaring_bitmap_maximum(r); for (int i = 0; i < ra->size; ++i) { uint8_t truetype = @@ -19682,6 +19661,7 @@ void roaring_bitmap_statistics(const roaring_bitmap_t *r, container_get_cardinality(ra->containers[i], ra->typecodes[i]); uint32_t sbytes = container_size_in_bytes(ra->containers[i], ra->typecodes[i]); + stat->cardinality += card; switch (truetype) { case BITSET_CONTAINER_TYPE: stat->n_bitset_containers++; @@ -20831,7 +20811,7 @@ roaring_bitmap_t *roaring_bitmap_deserialize(const void *buf) { if (bitmap == NULL) { return NULL; } - roaring_bulk_context_t context = {0}; + roaring_bulk_context_t context = {0, 0, 0, 0}; for (uint32_t i = 0; i < card; i++) { // elems may not be aligned, read with memcpy uint32_t elem; @@ -20874,7 +20854,7 @@ roaring_bitmap_t *roaring_bitmap_deserialize_safe(const void *buf, if (bitmap == NULL) { return NULL; } - roaring_bulk_context_t context = {0}; + roaring_bulk_context_t context = {0, 0, 0, 0}; for (uint32_t i = 0; i < card; i++) { // elems may not be aligned, read with memcpy uint32_t elem; @@ -22876,7 +22856,7 @@ roaring64_bitmap_t *roaring64_bitmap_of_ptr(size_t n_args, roaring64_bitmap_t *roaring64_bitmap_of(size_t n_args, ...) { roaring64_bitmap_t *r = roaring64_bitmap_create(); - roaring64_bulk_context_t context = {0}; + roaring64_bulk_context_t context = {0, 0, 0, 0, 0, 0, 0}; va_list ap; va_start(ap, n_args); for (size_t i = 0; i < n_args; i++) { @@ -22969,7 +22949,7 @@ void roaring64_bitmap_add_many(roaring64_bitmap_t *r, size_t n_args, return; } const uint64_t *end = vals + n_args; - roaring64_bulk_context_t context = {0}; + roaring64_bulk_context_t context = {0, 0, 0, 0, 0, 0, 0}; for (const uint64_t *current_val = vals; current_val != end; current_val++) { roaring64_bitmap_add_bulk(r, &context, *current_val); @@ -23108,7 +23088,8 @@ bool roaring64_bitmap_contains_bulk(const roaring64_bitmap_t *r, uint8_t high48[ART_KEY_BYTES]; uint16_t low16 = split_key(val, high48); - if (context->leaf == NULL || context->high_bytes != high48) { + if (context->leaf == NULL || + art_compare_keys(context->high_bytes, high48) != 0) { // We're not positioned anywhere yet or the high bits of the key // differ. leaf_t *leaf = (leaf_t *)art_find(&r->art, high48); @@ -23292,7 +23273,7 @@ void roaring64_bitmap_remove_many(roaring64_bitmap_t *r, size_t n_args, return; } const uint64_t *end = vals + n_args; - roaring64_bulk_context_t context = {0}; + roaring64_bulk_context_t context = {0, 0, 0, 0, 0, 0, 0}; for (const uint64_t *current_val = vals; current_val != end; current_val++) { roaring64_bitmap_remove_bulk(r, &context, *current_val); @@ -23455,6 +23436,50 @@ bool roaring64_bitmap_run_optimize(roaring64_bitmap_t *r) { return has_run_container; } +/** + * (For advanced users.) + * Collect statistics about the bitmap + */ +void roaring64_bitmap_statistics(const roaring64_bitmap_t *r, + roaring64_statistics_t *stat) { + memset(stat, 0, sizeof(*stat)); + stat->min_value = roaring64_bitmap_minimum(r); + stat->max_value = roaring64_bitmap_maximum(r); + + art_iterator_t it = art_init_iterator(&r->art, true); + while (it.value != NULL) { + leaf_t *leaf = (leaf_t *)it.value; + stat->n_containers++; + uint8_t truetype = get_container_type(leaf->container, leaf->typecode); + uint32_t card = + container_get_cardinality(leaf->container, leaf->typecode); + uint32_t sbytes = + container_size_in_bytes(leaf->container, leaf->typecode); + stat->cardinality += card; + switch (truetype) { + case BITSET_CONTAINER_TYPE: + stat->n_bitset_containers++; + stat->n_values_bitset_containers += card; + stat->n_bytes_bitset_containers += sbytes; + break; + case ARRAY_CONTAINER_TYPE: + stat->n_array_containers++; + stat->n_values_array_containers += card; + stat->n_bytes_array_containers += sbytes; + break; + case RUN_CONTAINER_TYPE: + stat->n_run_containers++; + stat->n_values_run_containers += card; + stat->n_bytes_run_containers += sbytes; + break; + default: + assert(false); + roaring_unreachable; + } + art_iterator_next(&it); + } +} + static bool roaring64_leaf_internal_validate(const art_val_t *val, const char **reason) { leaf_t *leaf = (leaf_t *)val; @@ -24576,7 +24601,7 @@ bool roaring64_bitmap_iterate(const roaring64_bitmap_t *r, void roaring64_bitmap_to_uint64_array(const roaring64_bitmap_t *r, uint64_t *out) { - roaring64_iterator_t it = {0}; + roaring64_iterator_t it; // gets initialized in the next line roaring64_iterator_init_at(r, &it, /*first=*/true); roaring64_iterator_read(&it, out, UINT64_MAX); } diff --git a/croaring-sys/CRoaring/roaring.h b/croaring-sys/CRoaring/roaring.h index ffef052..c0d9a52 100644 --- a/croaring-sys/CRoaring/roaring.h +++ b/croaring-sys/CRoaring/roaring.h @@ -1,5 +1,5 @@ // !!! DO NOT EDIT - THIS IS AN AUTO-GENERATED FILE !!! -// Created by amalgamation.sh on 2024-04-02T13:42:32Z +// Created by amalgamation.sh on 2024-05-13T21:29:25Z /* * The CRoaring project is under a dual license (Apache/MIT). @@ -59,11 +59,11 @@ // /include/roaring/roaring_version.h automatically generated by release.py, do not change by hand #ifndef ROARING_INCLUDE_ROARING_VERSION #define ROARING_INCLUDE_ROARING_VERSION -#define ROARING_VERSION "3.0.1" +#define ROARING_VERSION "4.0.0" enum { - ROARING_VERSION_MAJOR = 3, + ROARING_VERSION_MAJOR = 4, ROARING_VERSION_MINOR = 0, - ROARING_VERSION_REVISION = 1 + ROARING_VERSION_REVISION = 0 }; #endif // ROARING_INCLUDE_ROARING_VERSION // clang-format on/* end file include/roaring/roaring_version.h */ @@ -159,14 +159,48 @@ typedef struct roaring_statistics_s { max_value; /* the maximal value, undefined if cardinality is zero */ uint32_t min_value; /* the minimal value, undefined if cardinality is zero */ - uint64_t sum_value; /* the sum of all values (could be used to compute - average) */ + uint64_t sum_value; /* deprecated always zero */ uint64_t cardinality; /* total number of values stored in the bitmap */ // and n_values_arrays, n_values_rle, n_values_bitmap } roaring_statistics_t; +/** + * (For advanced users.) + * The roaring64_statistics_t can be used to collect detailed statistics about + * the composition of a roaring64 bitmap. + */ +typedef struct roaring64_statistics_s { + uint64_t n_containers; /* number of containers */ + + uint64_t n_array_containers; /* number of array containers */ + uint64_t n_run_containers; /* number of run containers */ + uint64_t n_bitset_containers; /* number of bitmap containers */ + + uint64_t + n_values_array_containers; /* number of values in array containers */ + uint64_t n_values_run_containers; /* number of values in run containers */ + uint64_t + n_values_bitset_containers; /* number of values in bitmap containers */ + + uint64_t n_bytes_array_containers; /* number of allocated bytes in array + containers */ + uint64_t n_bytes_run_containers; /* number of allocated bytes in run + containers */ + uint64_t n_bytes_bitset_containers; /* number of allocated bytes in bitmap + containers */ + + uint64_t + max_value; /* the maximal value, undefined if cardinality is zero */ + uint64_t + min_value; /* the minimal value, undefined if cardinality is zero */ + + uint64_t cardinality; /* total number of values stored in the bitmap */ + + // and n_values_arrays, n_values_rle, n_values_bitmap +} roaring64_statistics_t; + /** * Roaring-internal type used to iterate within a roaring container. */ @@ -2542,6 +2576,13 @@ uint64_t roaring64_bitmap_maximum(const roaring64_bitmap_t *r); */ bool roaring64_bitmap_run_optimize(roaring64_bitmap_t *r); +/** + * (For advanced users.) + * Collect statistics about the bitmap + */ +void roaring64_bitmap_statistics(const roaring64_bitmap_t *r, + roaring64_statistics_t *stat); + /** * Perform internal consistency checks. * diff --git a/croaring-sys/CRoaring/roaring.hh b/croaring-sys/CRoaring/roaring.hh index a8f4fad..1881de5 100644 --- a/croaring-sys/CRoaring/roaring.hh +++ b/croaring-sys/CRoaring/roaring.hh @@ -1,5 +1,5 @@ // !!! DO NOT EDIT - THIS IS AN AUTO-GENERATED FILE !!! -// Created by amalgamation.sh on 2024-04-02T13:42:32Z +// Created by amalgamation.sh on 2024-05-13T21:29:25Z /* * The CRoaring project is under a dual license (Apache/MIT). diff --git a/croaring/Cargo.toml b/croaring/Cargo.toml index a135dc5..df42cfd 100644 --- a/croaring/Cargo.toml +++ b/croaring/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "croaring" -version = "2.0.0" +version = "2.0.1" edition = "2021" authors = ["croaring-rs developers"] license = "Apache-2.0" diff --git a/croaring/src/bitmap/imp.rs b/croaring/src/bitmap/imp.rs index f6f7b57..e07ac7f 100644 --- a/croaring/src/bitmap/imp.rs +++ b/croaring/src/bitmap/imp.rs @@ -24,7 +24,7 @@ impl Bitmap { // (it can be moved safely), and can be freed with `free`, without freeing the underlying // containers and auxiliary data. Ensure this is still valid every time we update // the version of croaring. - const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 3 && ffi::ROARING_VERSION_MINOR == 0); + const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 4 && ffi::ROARING_VERSION_MINOR == 0); ffi::roaring_free(p.cast::()); result } @@ -1534,7 +1534,6 @@ impl Bitmap { /// assert_eq!(statistics.n_bytes_bitset_containers, 0); /// assert_eq!(statistics.max_value, 99); /// assert_eq!(statistics.min_value, 1); - /// assert_eq!(statistics.sum_value, 4950); /// assert_eq!(statistics.cardinality, 99); /// /// bitmap.run_optimize(); @@ -1552,18 +1551,50 @@ impl Bitmap { /// assert_eq!(statistics.n_bytes_bitset_containers, 0); /// assert_eq!(statistics.max_value, 99); /// assert_eq!(statistics.min_value, 1); - /// assert_eq!(statistics.sum_value, 4950); /// assert_eq!(statistics.cardinality, 99); /// ``` #[inline] #[doc(alias = "roaring_bitmap_statistics")] #[must_use] pub fn statistics(&self) -> Statistics { - let mut statistics: ffi::roaring_statistics_s = unsafe { mem::zeroed() }; - - unsafe { ffi::roaring_bitmap_statistics(&self.bitmap, &mut statistics) }; - - statistics + let mut statistics = mem::MaybeUninit::zeroed(); + + unsafe { ffi::roaring_bitmap_statistics(&self.bitmap, statistics.as_mut_ptr()) }; + + // Exhaustively extract the fields to ensure we don't miss any if they're added + let ffi::roaring_statistics_t { + n_containers, + n_array_containers, + n_run_containers, + n_bitset_containers, + n_values_array_containers, + n_values_run_containers, + n_values_bitset_containers, + n_bytes_array_containers, + n_bytes_run_containers, + n_bytes_bitset_containers, + max_value, + min_value, + // sum_value is deprecated and always zero + sum_value: _sum_value, + cardinality, + } = unsafe { statistics.assume_init() }; + + Statistics { + n_containers, + n_array_containers, + n_run_containers, + n_bitset_containers, + n_values_array_containers, + n_values_run_containers, + n_values_bitset_containers, + n_bytes_array_containers, + n_bytes_run_containers, + n_bytes_bitset_containers, + max_value, + min_value, + cardinality, + } } /// Store the bitmap to a bitset diff --git a/croaring/src/bitmap/mod.rs b/croaring/src/bitmap/mod.rs index 6e4aa17..417c04a 100644 --- a/croaring/src/bitmap/mod.rs +++ b/croaring/src/bitmap/mod.rs @@ -87,7 +87,40 @@ unsafe impl<'a> Sync for BitmapView<'a> {} unsafe impl<'a> Send for BitmapView<'a> {} /// Detailed statistics on the composition of a bitmap -pub type Statistics = ffi::roaring_statistics_s; +/// +/// See [`Bitmap::statistics`] for more information +#[derive(Debug, Copy, Clone, PartialEq, Eq, Default)] +pub struct Statistics { + /// Number of containers in the bitmap + pub n_containers: u32, + /// Number of array containers in the bitmap + pub n_array_containers: u32, + /// Number of run containers in the bitmap + pub n_run_containers: u32, + /// Number of bitset containers in the bitmap + pub n_bitset_containers: u32, + /// Number of values stored in array containers + pub n_values_array_containers: u32, + /// Number of values stored in run containers + pub n_values_run_containers: u32, + /// Number of values stored in bitset containers + pub n_values_bitset_containers: u32, + /// Number of bytes used by array containers + pub n_bytes_array_containers: u32, + /// Number of bytes used by run containers + pub n_bytes_run_containers: u32, + /// Number of bytes used by bitset containers + pub n_bytes_bitset_containers: u32, + /// Maximum value stored in the bitmap + pub max_value: u32, + /// Minimum value stored in the bitmap + pub min_value: u32, + /// Number of values stored in the bitmap + pub cardinality: u64, + // NOTE: This has every field as the roaring_statistics_t struct in CRoaring, + // except for the sum_value, which is deprecated and always zero since + // CRoaring 4.0.0 +} mod imp; mod iter; diff --git a/croaring/src/bitmap/ops.rs b/croaring/src/bitmap/ops.rs index 6d9a1be..f62b64f 100644 --- a/croaring/src/bitmap/ops.rs +++ b/croaring/src/bitmap/ops.rs @@ -138,7 +138,7 @@ impl Drop for Bitmap { fn drop(&mut self) { // This depends somewhat heavily on the implementation of croaring, // Ensure this is still valid every time we update the version of croaring. - const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 3 && ffi::ROARING_VERSION_MINOR == 0); + const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 4 && ffi::ROARING_VERSION_MINOR == 0); // Per https://github.com/RoaringBitmap/CRoaring/blob/4f8dbdb0cc884626b20ef0cc9e891f701fe157cf/cpp/roaring.hh#L182 // > By contract, calling roaring_bitmap_clear() is enough to diff --git a/croaring/src/bitmap/view.rs b/croaring/src/bitmap/view.rs index 1fa3ff1..73fbc43 100644 --- a/croaring/src/bitmap/view.rs +++ b/croaring/src/bitmap/view.rs @@ -27,7 +27,7 @@ impl<'a> BitmapView<'a> { // `containers` array is stored immediately after the roaring_bitmap_t data. // Ensure this is still valid every time we update // the version of croaring. - const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 3 && ffi::ROARING_VERSION_MINOR == 0); + const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 4 && ffi::ROARING_VERSION_MINOR == 0); assert!(!p.is_null()); diff --git a/croaring/src/bitmap64/imp.rs b/croaring/src/bitmap64/imp.rs index f12865a..21c0cec 100644 --- a/croaring/src/bitmap64/imp.rs +++ b/croaring/src/bitmap64/imp.rs @@ -1,5 +1,4 @@ -use crate::bitmap64::Bitmap64; -use crate::bitmap64::{Deserializer, Serializer}; +use super::{Bitmap64, Deserializer, Serializer, Statistics}; use core::mem::MaybeUninit; use core::ops::{Bound, RangeBounds}; use core::prelude::v1::*; @@ -947,6 +946,58 @@ impl Bitmap64 { } } + /// Returns statistics about the composition of a roaring bitmap64. + /// + /// # Examples + /// + /// ``` + /// use croaring::Bitmap64; + /// + /// let mut bitmap: Bitmap64 = (1..100).collect(); + /// let statistics = bitmap.statistics(); + /// + /// assert_eq!(statistics.n_containers, 1); + /// assert_eq!(statistics.n_array_containers, 1); + /// assert_eq!(statistics.n_run_containers, 0); + /// assert_eq!(statistics.n_bitset_containers, 0); + /// assert_eq!(statistics.n_values_array_containers, 99); + /// assert_eq!(statistics.n_values_run_containers, 0); + /// assert_eq!(statistics.n_values_bitset_containers, 0); + /// assert_eq!(statistics.n_bytes_array_containers, 198); + /// assert_eq!(statistics.n_bytes_run_containers, 0); + /// assert_eq!(statistics.n_bytes_bitset_containers, 0); + /// assert_eq!(statistics.max_value, 99); + /// assert_eq!(statistics.min_value, 1); + /// assert_eq!(statistics.cardinality, 99); + /// + /// bitmap.run_optimize(); + /// let statistics = bitmap.statistics(); + /// + /// assert_eq!(statistics.n_containers, 1); + /// assert_eq!(statistics.n_array_containers, 0); + /// assert_eq!(statistics.n_run_containers, 1); + /// assert_eq!(statistics.n_bitset_containers, 0); + /// assert_eq!(statistics.n_values_array_containers, 0); + /// assert_eq!(statistics.n_values_run_containers, 99); + /// assert_eq!(statistics.n_values_bitset_containers, 0); + /// assert_eq!(statistics.n_bytes_array_containers, 0); + /// assert_eq!(statistics.n_bytes_run_containers, 6); + /// assert_eq!(statistics.n_bytes_bitset_containers, 0); + /// assert_eq!(statistics.max_value, 99); + /// assert_eq!(statistics.min_value, 1); + /// assert_eq!(statistics.cardinality, 99); + /// ``` + #[inline] + #[doc(alias = "roaring64_bitmap_statistics")] + #[must_use] + pub fn statistics(&self) -> Statistics { + let mut stats = MaybeUninit::::zeroed(); + unsafe { + ffi::roaring64_bitmap_statistics(self.raw.as_ptr(), stats.as_mut_ptr()); + stats.assume_init() + } + } + /// Ensure the bitmap is internally valid /// /// This is useful for development, but is not needed for normal use: diff --git a/croaring/src/bitmap64/mod.rs b/croaring/src/bitmap64/mod.rs index 0b96ed5..04521b4 100644 --- a/croaring/src/bitmap64/mod.rs +++ b/croaring/src/bitmap64/mod.rs @@ -15,3 +15,8 @@ pub struct Bitmap64 { } unsafe impl Sync for Bitmap64 {} unsafe impl Send for Bitmap64 {} + +/// Detailed statistics on the composition of a bitmap +/// +/// See [`Bitmap64::statistics`] for more information +pub type Statistics = ffi::roaring64_statistics_t; diff --git a/croaring/src/bitset/imp.rs b/croaring/src/bitset/imp.rs index d29a08c..cdacd93 100644 --- a/croaring/src/bitset/imp.rs +++ b/croaring/src/bitset/imp.rs @@ -9,7 +9,7 @@ impl Bitset { let result = Self { bitset: p.read() }; // It seems unlikely that the bitset type will meaningfully change, but check if we ever go // to a version 3. - const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 3); + const _: () = assert!(ffi::ROARING_VERSION_MAJOR == 4); ffi::roaring_free(p.cast()); result }