12#include <seqan3/contrib/sdsl-lite.hpp>
84template <data_layout data_layout_mode_ = data_layout::uncompressed>
89 template <data_layout data_layout_mode>
95 seqan3::contrib::sdsl::bit_vector,
96 seqan3::contrib::sdsl::sd_vector<>>;
108 13'043'817'825'332'782'213ULL,
109 10'650'232'656'628'343'401ULL,
110 16'499'269'484'942'379'435ULL,
111 4'893'150'838'803'335'377ULL};
124 h *= 11'400'714'819'323'198'485ULL;
126#ifdef __SIZEOF_INT128__
127 h =
static_cast<uint64_t
>((
static_cast<__uint128_t
>(h) *
static_cast<__uint128_t
>(
size_in_bits)) >> 64);
167 throw std::logic_error{
"The number of hash functions must be > 0 and <= 5."};
191 data = seqan3::contrib::sdsl::sd_vector<>{bf.data};
215 assert(idx <
data.size());
235 seqan3::contrib::sdsl::util::_set_zero_bits(
data);
258 assert(idx <
data.size());
284 template <std::ranges::range value_range_t>
285 size_t count(value_range_t && values)
const noexcept
287 static_assert(std::ranges::input_range<value_range_t>,
"The values must model input_range.");
288 static_assert(std::unsigned_integral<std::ranges::range_value_t<value_range_t>>,
289 "An individual value must be an unsigned integral.");
293 for (
auto && value : values)
330 return std::tie(lhs.size_in_bits, lhs.hash_shift, lhs.hash_funs, lhs.data)
331 ==
std::tie(rhs.size_in_bits, rhs.hash_shift, rhs.hash_funs, rhs.data);
341 return !(lhs == rhs);
374 template <cereal_archive archive_t>
Provides strong types for the (Interleaved) Bloom Filter.
Adaptions of concepts from the Cereal library.
The Bloom Filter. A data structure that efficiently answers set-membership queries.
Definition bloom_filter.hpp:86
size_t size_in_bits
The size of the underlying bit vector in bits.
Definition bloom_filter.hpp:99
friend bool operator!=(bloom_filter const &lhs, bloom_filter const &rhs) noexcept
Test for inequality.
Definition bloom_filter.hpp:339
constexpr data_type & raw_data() noexcept
Provides direct, unsafe access to the underlying data structure.
Definition bloom_filter.hpp:355
size_t hash_shift
The number of bits to shift the hash value before doing multiplicative hashing.
Definition bloom_filter.hpp:101
bloom_filter(bloom_filter &&)=default
Defaulted.
static constexpr data_layout data_layout_mode
Indicates whether the Bloom Filter is compressed.
Definition bloom_filter.hpp:136
static constexpr std::array< size_t, 5 > hash_seeds
Precalculated seeds for multiplicative hashing. We use large irrational numbers for a uniform hashing.
Definition bloom_filter.hpp:107
constexpr data_type const & raw_data() const noexcept
Provides direct, unsafe access to the underlying data structure.
Definition bloom_filter.hpp:361
bloom_filter & operator=(bloom_filter const &)=default
Defaulted.
bool contains(size_t const value) const noexcept
Check whether a value is present in the Bloom Filter.
Definition bloom_filter.hpp:253
bloom_filter(bloom_filter< data_layout::uncompressed > const &bf)
Construct a compressed Bloom Filter.
Definition bloom_filter.hpp:186
constexpr size_t hash_and_fit(size_t h, size_t const seed) const
Perturbs a value and fits it into the vector.
Definition bloom_filter.hpp:120
data_type data
The bitvector.
Definition bloom_filter.hpp:105
friend bool operator==(bloom_filter const &lhs, bloom_filter const &rhs) noexcept
Test for equality.
Definition bloom_filter.hpp:328
size_t hash_funs
The number of hash functions.
Definition bloom_filter.hpp:103
void reset() noexcept
Remove all values from the Bloom Filter by setting all bits to 0.
Definition bloom_filter.hpp:232
bloom_filter(bloom_filter const &)=default
Defaulted.
size_t hash_function_count() const noexcept
Returns the number of hash functions used in the Bloom Filter.
Definition bloom_filter.hpp:306
size_t count(value_range_t &&values) const noexcept
Counts the occurrences for all values in a range.
Definition bloom_filter.hpp:285
bloom_filter()=default
Defaulted.
size_t bit_size() const noexcept
Returns the size of the underlying bitvector.
Definition bloom_filter.hpp:314
bloom_filter & operator=(bloom_filter &&)=default
Defaulted.
void emplace(size_t const value) noexcept
Inserts a value into the Bloom Filter.
Definition bloom_filter.hpp:209
~bloom_filter()=default
Defaulted.
bloom_filter(seqan3::bin_size size, seqan3::hash_function_count funs=seqan3::hash_function_count{2u})
Construct an uncompressed Bloom Filter.
Definition bloom_filter.hpp:160
data_layout
Determines if the Interleaved Bloom Filter is compressed.
Definition bloom_filter_strong_types.hpp:23
@ uncompressed
The Interleaved Bloom Filter is uncompressed.
Definition bloom_filter_strong_types.hpp:24
@ compressed
The Interleaved Bloom Filter is compressed.
Definition bloom_filter_strong_types.hpp:25
The main SeqAn3 namespace.
Definition aligned_sequence_concept.hpp:26
A strong type that represents the number of bits for each bin in the seqan3::interleaved_bloom_filter.
Definition bloom_filter_strong_types.hpp:38
A strong type that represents the number of hash functions for the seqan3::interleaved_bloom_filter.
Definition bloom_filter_strong_types.hpp:45
strong_type for seed.
Definition minimiser_hash.hpp:22