SeqAn3 3.4.0-rc.4
The Modern C++ library for sequence analysis.
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages Concepts
bi_fm_index_cursor.hpp
Go to the documentation of this file.
1// SPDX-FileCopyrightText: 2006-2025 Knut Reinert & Freie Universität Berlin
2// SPDX-FileCopyrightText: 2016-2025 Knut Reinert & MPI für molekulare Genetik
3// SPDX-License-Identifier: BSD-3-Clause
4
10#pragma once
11
12#include <array>
13#include <ranges>
14
18#include <seqan3/contrib/sdsl-lite.hpp>
23
24namespace seqan3
25{
26
49template <typename index_t>
51{
52public:
54 using index_type = index_t;
55
60 using size_type = typename index_type::size_type;
62
67 using fwd_cursor = fm_index_cursor<fm_index<typename index_type::alphabet_type,
68 index_type::text_layout_mode,
69 typename index_type::sdsl_index_type>>;
71
72private:
74 using sdsl_char_type = typename index_type::sdsl_char_type;
76 using sdsl_index_type = typename index_t::sdsl_index_type;
78 using sdsl_sigma_type = typename index_type::sdsl_sigma_type;
80 using index_alphabet_type = typename index_t::alphabet_type;
85
87 index_type const * index{nullptr};
88
93 size_type fwd_lb{};
95 size_type fwd_rb{};
97 size_type rev_lb{};
99 size_type rev_rb{};
100 //\}
101
103 sdsl_sigma_type sigma{};
104
111 // parent_* and _last_char only have to be stored for the (unidirectional) cursor that has been used last for
112 // extend_right() or cycle_back() resp. extend_left() or cycle_front(), (i.e. either fwd or rev). Thus there is no
113 // need to store it twice. Once the cursor is switched, the information becomes invalid anyway.
114
116 size_type parent_lb{};
118 size_type parent_rb{};
120 sdsl_char_type _last_char{};
121 //\}
122
124 size_type depth{}; // equal for both cursors. only stored once
125
126 // supports assertions to check whether cycle_back() resp. cycle_front() is called on the same direction as the last
127 // extend_right([...]) resp. extend_left([...])
128#ifndef NDEBUG
130 // cycle_back() and cycle_front()
131 bool fwd_cursor_last_used = false;
132#endif
133
135 size_type offset() const noexcept
136 {
137 assert(index->size() > query_length());
138 return index->size() - query_length() - 1; // since the string is reversed during construction
139 }
140
142 template <typename csa_t>
143 requires (std::same_as<csa_t, typename index_type::sdsl_index_type>
144 || std::same_as<csa_t, typename index_type::rev_sdsl_index_type>)
145 bool bidirectional_search(csa_t const & csa,
146 sdsl_char_type const c,
147 size_type & l_fwd,
148 size_type & r_fwd,
149 size_type & l_bwd,
150 size_type & r_bwd) const noexcept
151 {
152 assert((l_fwd <= r_fwd) && (r_fwd < csa.size()));
153 assert(r_fwd + 1 >= l_fwd);
154 assert(r_bwd + 1 - l_bwd == r_fwd + 1 - l_fwd);
155
156 size_type _l_fwd, _r_fwd, _l_bwd, _r_bwd;
157
158 size_type cc = c;
159 if constexpr (!std::same_as<index_alphabet_type, seqan3::contrib::sdsl::plain_byte_alphabet>)
160 {
161 cc = csa.char2comp[c];
162 if (cc == 0 && c > 0) // [[unlikely]]
163 return false;
164 }
165
166 size_type const c_begin = csa.C[cc];
167 if (r_fwd + 1 - l_fwd == csa.size()) // [[unlikely]]
168 {
169 _l_fwd = c_begin;
170 _l_bwd = c_begin;
171 _r_fwd = csa.C[cc + 1] - 1;
172 _r_bwd = _r_fwd;
173 // if we use not the plain_byte_alphabet, we could return always return true here
174 }
175 else
176 {
177 auto const r_s_b = csa.wavelet_tree.lex_count(l_fwd, r_fwd + 1, c);
178 size_type const rank_l = std::get<0>(r_s_b);
179 size_type const s = std::get<1>(r_s_b), b = std::get<2>(r_s_b);
180 size_type const rank_r = r_fwd - l_fwd - s - b + rank_l;
181 _l_fwd = c_begin + rank_l;
182 _r_fwd = c_begin + rank_r;
183 _l_bwd = l_bwd + s;
184 _r_bwd = r_bwd - b;
185 }
186
187 if (_r_fwd >= _l_fwd)
188 {
189 l_fwd = _l_fwd;
190 r_fwd = _r_fwd;
191 l_bwd = _l_bwd;
192 r_bwd = _r_bwd;
193 assert(r_fwd + 1 >= l_fwd);
194 assert(r_bwd + 1 - l_bwd == r_fwd + 1 - l_fwd);
195 return true;
196 }
197 return false;
198 }
199
201 template <typename csa_t>
202 requires (std::same_as<csa_t, typename index_type::sdsl_index_type>
203 || std::same_as<csa_t, typename index_type::rev_sdsl_index_type>)
204 bool bidirectional_search_cycle(csa_t const & csa,
205 sdsl_char_type const c,
206 size_type const l_parent,
207 size_type const r_parent,
208 size_type & l_fwd,
209 size_type & r_fwd,
210 size_type & l_bwd,
211 size_type & r_bwd) const noexcept
212 {
213 assert((l_parent <= r_parent) && (r_parent < csa.size()));
214
215 size_type c_begin;
216 if constexpr (std::same_as<index_alphabet_type, seqan3::contrib::sdsl::plain_byte_alphabet>)
217 c_begin = csa.C[c]; // TODO: check whether this can be removed
218 else
219 c_begin = csa.C[csa.char2comp[c]];
220
221 auto const r_s_b = csa.wavelet_tree.lex_count(l_parent, r_parent + 1, c);
222 size_type const s = std::get<1>(r_s_b), b = std::get<2>(r_s_b), rank_l = std::get<0>(r_s_b),
223 rank_r = r_parent - l_parent - s - b + rank_l;
224
225 size_type const _l_fwd = c_begin + rank_l;
226 size_type const _r_fwd = c_begin + rank_r;
227 size_type const _l_bwd = r_bwd + 1;
228 size_type const _r_bwd = r_bwd + 1 + rank_r - rank_l;
229
230 if (_r_fwd >= _l_fwd)
231 {
232 l_fwd = _l_fwd;
233 r_fwd = _r_fwd;
234 l_bwd = _l_bwd;
235 r_bwd = _r_bwd;
236 assert(r_fwd + 1 >= l_fwd);
237 assert(r_bwd + 1 - l_bwd == r_fwd + 1 - l_fwd);
238 return true;
239 }
240 return false;
241 }
242
243public:
248 // Default construction is necessary to make this class semi-regular and e.g., to allow construction of
249 // std::array of cursors.
256
259 index(&_index),
260 fwd_lb(0),
261 fwd_rb(_index.size() - 1),
262 rev_lb(0),
263 rev_rb(_index.size() - 1),
264 sigma(_index.fwd_fm.index.sigma - index_t::text_layout_mode),
265 depth(0)
266 {}
267 //\}
268
281 bool operator==(bi_fm_index_cursor const & rhs) const noexcept
282 {
283 assert(index != nullptr);
284 // equal SA interval implies equal parent node information (or both are root nodes)
285 assert(!(fwd_lb == rhs.fwd_lb && fwd_rb == rhs.fwd_rb && depth == rhs.depth) || (depth == 0)
286 || (parent_lb == rhs.parent_lb && parent_rb == rhs.parent_rb && _last_char == rhs._last_char));
287
288 return std::tie(fwd_lb, fwd_rb, depth) == std::tie(rhs.fwd_lb, rhs.fwd_rb, rhs.depth);
289 }
290
303 bool operator!=(bi_fm_index_cursor const & rhs) const noexcept
304 {
305 assert(index != nullptr);
306
307 return !(*this == rhs);
308 }
309
328 {
329#ifndef NDEBUG
330 fwd_cursor_last_used = true;
331#endif
332
333 assert(index != nullptr);
334
335 size_type new_parent_lb = fwd_lb, new_parent_rb = fwd_rb;
336
337 sdsl_sigma_type c = 1; // NOTE: start with 0 or 1 depending on implicit_sentintel
338 while (c < sigma
339 && !bidirectional_search(index->fwd_fm.index,
340 index->fwd_fm.index.comp2char[c],
341 fwd_lb,
342 fwd_rb,
343 rev_lb,
344 rev_rb))
345 {
346 ++c;
347 }
348
349 if (c != sigma)
350 {
351 parent_lb = new_parent_lb;
352 parent_rb = new_parent_rb;
353
355 _last_char = static_cast<sdsl_char_type>(c);
356 ++depth;
357
358 return true;
359 }
360 return false;
361 }
362
381 {
382#ifndef NDEBUG
383 fwd_cursor_last_used = false;
384#endif
385
386 assert(index != nullptr);
387
388 size_type new_parent_lb = rev_lb, new_parent_rb = rev_rb;
389
390 sdsl_sigma_type c = 1; // NOTE: start with 0 or 1 depending on implicit_sentintel
391 while (c < sigma
392 && !bidirectional_search(index->rev_fm.index,
393 index->rev_fm.index.comp2char[c],
394 rev_lb,
395 rev_rb,
396 fwd_lb,
397 fwd_rb))
398 {
399 ++c;
400 }
401
402 if (c != sigma)
403 {
404 parent_lb = new_parent_lb;
405 parent_rb = new_parent_rb;
406
408 _last_char = static_cast<sdsl_char_type>(c);
409 ++depth;
410
411 return true;
412 }
413 return false;
414 }
415
429 template <typename char_t>
430 requires std::convertible_to<char_t, index_alphabet_type>
431 bool extend_right(char_t const c) noexcept
432 {
433#ifndef NDEBUG
434 fwd_cursor_last_used = true;
435#endif
436
437 assert(index != nullptr);
438 // The rank cannot exceed 255 for single text and 254 for text collections as they are reserved as sentinels
439 // for the indexed text.
440 assert(seqan3::to_rank(static_cast<index_alphabet_type>(c))
441 < ((index_type::text_layout_mode == text_layout::single) ? 255 : 254));
442
443 size_type new_parent_lb = fwd_lb, new_parent_rb = fwd_rb;
444
445 auto c_char = seqan3::to_rank(static_cast<index_alphabet_type>(c)) + 1;
446 if (bidirectional_search(index->fwd_fm.index, c_char, fwd_lb, fwd_rb, rev_lb, rev_rb))
447 {
448 parent_lb = new_parent_lb;
449 parent_rb = new_parent_rb;
450
451 _last_char = c_char;
452 ++depth;
453
454 return true;
455 }
456 return false;
457 }
458
460 template <typename char_type>
461 requires seqan3::detail::is_char_adaptation_v<char_type>
462 bool extend_right(char_type const * cstring) noexcept
463 {
465 }
466
480 template <typename char_t>
481 requires std::convertible_to<char_t, index_alphabet_type>
482 bool extend_left(char_t const c) noexcept
483 {
484#ifndef NDEBUG
485 fwd_cursor_last_used = false;
486#endif
487
488 assert(index != nullptr);
489 // The rank cannot exceed 255 for single text and 254 for text collections as they are reserved as sentinels
490 // for the indexed text.
491 assert(seqan3::to_rank(static_cast<index_alphabet_type>(c))
492 < ((index_type::text_layout_mode == text_layout::single) ? 255 : 254));
493
494 size_type new_parent_lb = rev_lb, new_parent_rb = rev_rb;
495
496 auto c_char = seqan3::to_rank(static_cast<index_alphabet_type>(c)) + 1;
497 if (bidirectional_search(index->rev_fm.index, c_char, rev_lb, rev_rb, fwd_lb, fwd_rb))
498 {
499 parent_lb = new_parent_lb;
500 parent_rb = new_parent_rb;
501
502 _last_char = c_char;
503 ++depth;
504
505 return true;
506 }
507 return false;
508 }
509
511 template <typename char_type>
512 requires seqan3::detail::is_char_adaptation_v<char_type>
513 bool extend_left(char_type const * cstring) noexcept
514 {
516 }
517
534 template <std::ranges::range seq_t>
535 bool extend_right(seq_t && seq) noexcept
536 {
537 static_assert(std::ranges::forward_range<seq_t>, "The query must model forward_range.");
538 static_assert(std::convertible_to<range_innermost_value_t<seq_t>, index_alphabet_type>,
539 "The alphabet of the sequence must be convertible to the alphabet of the index.");
540
541 assert(index != nullptr);
542
543 auto first = std::ranges::begin(seq);
544 auto last = std::ranges::end(seq);
545
546#ifndef NDEBUG
547 fwd_cursor_last_used = (first != last); // only if seq was not empty
548#endif
549
550 size_type _fwd_lb = fwd_lb, _fwd_rb = fwd_rb, _rev_lb = rev_lb, _rev_rb = rev_rb;
551 size_type new_parent_lb = parent_lb, new_parent_rb = parent_rb;
552 sdsl_char_type c = _last_char;
553 size_t len{0};
554
555 for (auto it = first; it != last; ++len, ++it)
556 {
557 // The rank cannot exceed 255 for single text and 254 for text collections as they are reserved as sentinels
558 // for the indexed text.
559 assert(seqan3::to_rank(static_cast<index_alphabet_type>(*it))
560 < ((index_type::text_layout_mode == text_layout::single) ? 255 : 254));
561
562 c = seqan3::to_rank(static_cast<index_alphabet_type>(*it)) + 1;
563
566 if (!bidirectional_search(index->fwd_fm.index, c, _fwd_lb, _fwd_rb, _rev_lb, _rev_rb))
567 return false;
568 }
569
570 fwd_lb = _fwd_lb;
571 fwd_rb = _fwd_rb;
572 rev_lb = _rev_lb;
573 rev_rb = _rev_rb;
574
575 parent_lb = new_parent_lb;
576 parent_rb = new_parent_rb;
577
578 _last_char = c;
579 depth += len;
580
581 return true;
582 }
583
604 template <std::ranges::range seq_t>
605 bool extend_left(seq_t && seq) noexcept
606 {
607 static_assert(std::ranges::bidirectional_range<seq_t>, "The query must model bidirectional_range.");
608 static_assert(std::convertible_to<range_innermost_value_t<seq_t>, index_alphabet_type>,
609 "The alphabet of the sequence must be convertible to the alphabet of the index.");
610 assert(index != nullptr);
611
612 auto rev_seq = std::views::reverse(seq);
613 auto first = std::ranges::begin(rev_seq);
614 auto last = std::ranges::end(rev_seq);
615
616#ifndef NDEBUG
617 if (first != last) // only if seq was not empty
618 fwd_cursor_last_used = false;
619#endif
620
621 size_type _fwd_lb = fwd_lb, _fwd_rb = fwd_rb, _rev_lb = rev_lb, _rev_rb = rev_rb;
622 size_type new_parent_lb = parent_lb, new_parent_rb = parent_rb;
623 sdsl_char_type c = _last_char;
624 size_t len{0};
625
626 for (auto it = first; it != last; ++len, ++it)
627 {
628 // The rank cannot exceed 255 for single text and 254 for text collections as they are reserved as sentinels
629 // for the indexed text.
630 assert(seqan3::to_rank(static_cast<index_alphabet_type>(*it))
631 < ((index_type::text_layout_mode == text_layout::single) ? 255 : 254));
632
633 c = seqan3::to_rank(static_cast<index_alphabet_type>(*it)) + 1;
634
637 if (!bidirectional_search(index->rev_fm.index, c, _rev_lb, _rev_rb, _fwd_lb, _fwd_rb))
638 return false;
639 }
640
641 fwd_lb = _fwd_lb;
642 fwd_rb = _fwd_rb;
643 rev_lb = _rev_lb;
644 rev_rb = _rev_rb;
645
646 parent_lb = new_parent_lb;
647 parent_rb = new_parent_rb;
648 _last_char = c;
649 depth += len;
650
651 return true;
652 }
653
681 {
682#ifndef NDEBUG
683 // cycle_back() can only be used if the last extension was to the right.
684 assert(fwd_cursor_last_used);
685#endif
686
687 assert(index != nullptr && query_length() > 0);
688
689 sdsl_sigma_type c = _last_char + 1;
690
691 while (c < sigma
692 && !bidirectional_search_cycle(index->fwd_fm.index,
693 index->fwd_fm.index.comp2char[c],
694 parent_lb,
695 parent_rb,
696 fwd_lb,
697 fwd_rb,
698 rev_lb,
699 rev_rb))
700 {
701 ++c;
702 }
703
704 if (c != sigma)
705 {
707 _last_char = static_cast<sdsl_char_type>(c);
708
709 return true;
710 }
711 return false;
712 }
713
741 {
742#ifndef NDEBUG
743 // cycle_front() can only be used if the last extension was to the left.
744 assert(!fwd_cursor_last_used);
745#endif
746
747 assert(index != nullptr && query_length() > 0);
748
749 sdsl_sigma_type c = _last_char + 1;
750 while (c < sigma
751 && !bidirectional_search_cycle(index->rev_fm.index,
752 index->rev_fm.index.comp2char[c],
753 parent_lb,
754 parent_rb,
755 rev_lb,
756 rev_rb,
757 fwd_lb,
758 fwd_rb))
759 {
760 ++c;
761 }
762
763 if (c != sigma)
764 {
766 _last_char = static_cast<sdsl_char_type>(c);
767
768 return true;
769 }
770 return false;
771 }
772
790 {
791 assert(index != nullptr && query_length() > 0);
792
793 return index->fwd_fm.index.comp2char[_last_char] - 1; // text is not allowed to contain ranks of 0
794 }
795
809 {
810 assert(index != nullptr);
811 // depth == 0 -> root node
812 assert(depth != 0 || (fwd_lb == rev_lb && fwd_rb == rev_rb && fwd_lb == 0 && fwd_rb == index->size() - 1));
813
814 return depth;
815 }
816
837 {
838 assert(index != nullptr);
839
840 fwd_cursor cur{index->fwd_fm};
841 cur.parent_lb = parent_lb;
842 cur.parent_rb = parent_rb;
843 cur.node = {fwd_lb, fwd_rb, depth, _last_char};
844
845#ifndef NDEBUG
846 if (!fwd_cursor_last_used)
847 {
848 // invalidate parent interval
849 cur.parent_lb = 1;
850 cur.parent_rb = 0;
851 }
852#endif
853
854 return cur;
855 }
856
873 template <std::ranges::range text_t>
874 auto path_label(text_t && text) const noexcept
875 requires (index_t::text_layout_mode == text_layout::single)
876 {
877 static_assert(std::ranges::input_range<text_t>, "The text must model input_range.");
878 static_assert(range_dimension_v<text_t> == 1, "The input cannot be a text collection.");
879 static_assert(std::same_as<range_innermost_value_t<text_t>, index_alphabet_type>,
880 "The alphabet types of the given text and index differ.");
881 assert(index != nullptr);
882
883 size_type const query_begin = offset() - index->fwd_fm.index[fwd_lb];
885 }
886
888 template <std::ranges::range text_t>
889 auto path_label(text_t && text) const noexcept
890 requires (index_t::text_layout_mode == text_layout::collection)
891 {
892 static_assert(std::ranges::input_range<text_t>, "The text collection must model input_range.");
893 static_assert(range_dimension_v<text_t> == 2, "The input must be a text collection.");
894 static_assert(std::same_as<range_innermost_value_t<text_t>, index_alphabet_type>,
895 "The alphabet types of the given text and index differ.");
896 assert(index != nullptr);
897
898 // Position of query in concatenated text.
899 size_type const location = offset() - index->fwd_fm.index[fwd_lb];
900
901 // The rank represents the number of start positions of the individual sequences/texts in the collection
902 // before position `location + 1` and thereby also the number of delimiters.
903 size_type const rank = index->fwd_fm.text_begin_rs.rank(location + 1);
904 assert(rank > 0);
905 size_type const text_id = rank - 1;
906
907 // The start location of the `text_id`-th text in the sequence (position of the `rank`-th 1 in the bitvector).
908 size_type const start_location = index->fwd_fm.text_begin_ss.select(rank);
909 // Substract lengths of previous sequences.
911
912 // Take subtext, slice query out of it
914 }
915
928 {
929 assert(index != nullptr && (1 + fwd_rb - fwd_lb == 1 + rev_rb - rev_lb));
930
931 return 1 + fwd_rb - fwd_lb;
932 }
933
946 requires (index_t::text_layout_mode == text_layout::single)
947 {
948 assert(index != nullptr);
949
951 occ.reserve(count());
952 for (size_type i = 0; i < count(); ++i)
953 {
954 occ.emplace_back(0, offset() - index->fwd_fm.index[fwd_lb + i]);
955 }
956 return occ;
957 }
958
961 requires (index_t::text_layout_mode == text_layout::collection)
962 {
963 assert(index != nullptr);
964
966 occ.reserve(count());
967 for (size_type i = 0; i < count(); ++i)
968 {
969 size_type loc = offset() - index->fwd_fm.index[fwd_lb + i];
970 size_type sequence_rank = index->fwd_fm.text_begin_rs.rank(loc + 1);
971 size_type sequence_position = loc - index->fwd_fm.text_begin_ss.select(sequence_rank);
972 occ.emplace_back(sequence_rank - 1, sequence_position);
973 }
974 return occ;
975 }
976
990 requires (index_t::text_layout_mode == text_layout::single)
991 {
992 assert(index != nullptr);
993
994 return std::views::iota(fwd_lb, fwd_lb + count())
995 | std::views::transform(
996 [*this, _offset = offset()](auto sa_pos)
997 {
998 return locate_result_value_type{0u, _offset - index->fwd_fm.index[sa_pos]};
999 });
1000 }
1001
1004 requires (index_t::text_layout_mode == text_layout::collection)
1005 {
1006 assert(index != nullptr);
1007
1008 return std::views::iota(fwd_lb, fwd_lb + count())
1009 | std::views::transform(
1010 [*this, _offset = offset()](auto sa_pos)
1011 {
1012 auto loc = _offset - index->fwd_fm.index[sa_pos];
1013 size_type sequence_rank = index->fwd_fm.text_begin_rs.rank(loc + 1);
1014 size_type sequence_position = loc - index->fwd_fm.text_begin_ss.select(sequence_rank);
1015 return locate_result_value_type{sequence_rank - 1, sequence_position};
1016 });
1017 }
1018
1026 template <cereal_archive archive_t>
1028 {
1029 archive(fwd_lb);
1030 archive(fwd_rb);
1031 archive(rev_lb);
1032 archive(rev_rb);
1033 archive(sigma);
1034 archive(parent_lb);
1035 archive(parent_rb);
1036 archive(_last_char);
1037 archive(depth);
1038 }
1040};
1041
1042} // namespace seqan3
Core alphabet concept and free function/type trait wrappers.
T begin(T... args)
Provides alphabet adaptations for standard char types.
The SeqAn Bidirectional FM Index Cursor.
Definition bi_fm_index_cursor.hpp:51
bool extend_right() noexcept
Tries to extend the query by the smallest possible character to the right such that the query is foun...
Definition bi_fm_index_cursor.hpp:327
size_type count() const noexcept
Counts the number of occurrences of the searched query in the text.
Definition bi_fm_index_cursor.hpp:927
bool extend_left(seq_t &&seq) noexcept
Tries to extend the query by seq to the left.
Definition bi_fm_index_cursor.hpp:605
bool operator==(bi_fm_index_cursor const &rhs) const noexcept
Compares two cursors.
Definition bi_fm_index_cursor.hpp:281
bool extend_left(char_type const *cstring) noexcept
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition bi_fm_index_cursor.hpp:513
auto path_label(text_t &&text) const noexcept
Returns the searched query.
Definition bi_fm_index_cursor.hpp:874
bool extend_left() noexcept
Tries to extend the query by the smallest possible character to the left such that the query is found...
Definition bi_fm_index_cursor.hpp:380
auto path_label(text_t &&text) const noexcept
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition bi_fm_index_cursor.hpp:889
locate_result_type locate() const
Locates the occurrences of the searched query in the text.
Definition bi_fm_index_cursor.hpp:945
bool cycle_back() noexcept
Tries to replace the rightmost character of the query by the next lexicographically larger character ...
Definition bi_fm_index_cursor.hpp:680
bool cycle_front() noexcept
Tries to replace the leftmost character of the query by the next lexicographically larger character s...
Definition bi_fm_index_cursor.hpp:740
auto lazy_locate() const
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition bi_fm_index_cursor.hpp:1003
fwd_cursor to_fwd_cursor() const noexcept
Returns a unidirectional seqan3::fm_index_cursor on the original text. path_label() on the returned u...
Definition bi_fm_index_cursor.hpp:836
size_type query_length() const noexcept
Returns the depth of the cursor node in the implicit suffix tree, i.e. the length of the sequence sea...
Definition bi_fm_index_cursor.hpp:808
bool extend_right(char_type const *cstring) noexcept
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition bi_fm_index_cursor.hpp:462
size_type last_rank() noexcept
Outputs the rightmost respectively leftmost rank depending on whether extend_right() or extend_left()...
Definition bi_fm_index_cursor.hpp:789
index_t index_type
Type of the index.
Definition bi_fm_index_cursor.hpp:54
typename index_type::size_type size_type
Type for representing positions in the indexed text.
Definition bi_fm_index_cursor.hpp:60
bool operator!=(bi_fm_index_cursor const &rhs) const noexcept
Compares two cursors.
Definition bi_fm_index_cursor.hpp:303
std::vector< std::pair< size_type, size_type > > locate() const
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition bi_fm_index_cursor.hpp:960
bi_fm_index_cursor() noexcept=default
Default constructor. Accessing member functions on a default constructed object is undefined behavior...
auto lazy_locate() const
Locates the occurrences of the searched query in the text on demand, i.e. a std::ranges::view is retu...
Definition bi_fm_index_cursor.hpp:989
bool extend_right(seq_t &&seq) noexcept
Tries to extend the query by seq to the right.
Definition bi_fm_index_cursor.hpp:535
bool extend_right(char_t const c) noexcept
Tries to extend the query by the character c to the right.
Definition bi_fm_index_cursor.hpp:431
bool extend_left(char_t const c) noexcept
Tries to extend the query by the character c to the left.
Definition bi_fm_index_cursor.hpp:482
A "pretty printer" for most SeqAn data structures and related types.
Definition debug_stream_type.hpp:79
The SeqAn FM Index Cursor.
Definition fm_index_cursor.hpp:83
The SeqAn FM Index.
Definition fm_index.hpp:185
Provides various transformation traits used by the range module.
Provides the unidirectional seqan3::fm_index.
Provides the seqan3::fm_index_cursor for searching in the unidirectional seqan3::fm_index.
constexpr auto to_rank
Return the rank representation of a (semi-)alphabet object.
Definition alphabet/concept.hpp:152
@ seq
The "sequence", usually a range of nucleotides or amino acids.
text_layout
The possible text layouts (single, collection) the seqan3::fm_index and seqan3::bi_fm_index can suppo...
Definition search/fm_index/concept.hpp:69
@ single
The text is a single range.
Definition search/fm_index/concept.hpp:71
@ collection
The text is a range of ranges.
Definition search/fm_index/concept.hpp:73
constexpr auto slice
A view adaptor that returns a half-open interval on the underlying range.
Definition slice.hpp:137
The main SeqAn3 namespace.
Definition aligned_sequence_concept.hpp:26
Provides seqan3::views::slice.
T tie(T... args)
Provides alphabet adaptations for standard uint types.
Hide me