SeqAn3 3.4.0-rc.1
The Modern C++ library for sequence analysis.
Loading...
Searching...
No Matches
wuss.hpp
Go to the documentation of this file.
1// SPDX-FileCopyrightText: 2006-2024 Knut Reinert & Freie Universität Berlin
2// SPDX-FileCopyrightText: 2016-2024 Knut Reinert & MPI für molekulare Genetik
3// SPDX-License-Identifier: BSD-3-Clause
4
10#pragma once
11
12#include <cmath>
13#include <limits>
14#include <vector>
15
19
20// ------------------------------------------------------------------
21// wuss
22// ------------------------------------------------------------------
23
24namespace seqan3
25{
26
56template <uint8_t SIZE = 51>
57class wuss : public alphabet_base<wuss<SIZE>, SIZE>
58{
59 static_assert(SIZE >= 15 && SIZE <= 67 && SIZE % 2 == 1,
60 "The wuss<> alphabet size must be an odd number in range 15..67.");
61
62private:
64 using base_t = alphabet_base<wuss<SIZE>, SIZE>;
65
67 friend base_t;
68
69protected:
72
73public:
75 using base_t::to_char;
76 using base_t::to_rank;
77
81 constexpr wuss() noexcept = default;
87
89
99 {
100 return interaction_tab[to_rank()] < 0;
101 }
102
108 constexpr bool is_pair_close() const noexcept
109 {
110 return interaction_tab[to_rank()] > 0;
111 }
112
118 constexpr bool is_unpaired() const noexcept
119 {
120 return interaction_tab[to_rank()] == 0;
121 }
122
128 // formula: (alphabet size - 7 unpaired characters) / 2, as every bracket exists as opening/closing pair
129 static constexpr uint8_t max_pseudoknot_depth{static_cast<uint8_t>((alphabet_size - 7) / 2)};
130
140 {
141 if (interaction_tab[to_rank()] != 0)
142 return std::abs(interaction_tab[to_rank()]) - 1;
143 else
144 return std::nullopt; // unpaired
145 }
147
148private:
150 static constexpr char_type rank_to_char(rank_type const rank)
151 {
152 return rank_to_char_table[rank];
153 }
154
156 static constexpr rank_type char_to_rank(char_type const chr)
157 {
158 using index_t = std::make_unsigned_t<char_type>;
159 return char_to_rank_table[static_cast<index_t>(chr)];
160 }
161
163 static constexpr std::array<char_type, alphabet_size> rank_to_char_table{
164 []() constexpr
165 {
167 chars{'.', ':', ',', '-', '_', '~', ';', '<', '(', '[', '{', '>', ')', ']', '}'};
168
169 // pseudoknot letters
170 for (rank_type rnk = 15u; rnk + 1u < alphabet_size; rnk += 2u)
171 {
172 char_type const off = static_cast<char_type>((rnk - 15u) / 2u);
173 chars[rnk] = 'A' + off;
174 chars[rnk + 1u] = 'a' + off;
175 }
176
177 return chars;
178 }()};
179
181 static constexpr std::array<rank_type, 256> char_to_rank_table{[]() constexpr
182 {
183 std::array<rank_type, 256> rank_table{};
184
185 rank_table.fill(6u);
186
187 // set alphabet values
188 for (rank_type rnk = 0u; rnk < alphabet_size;
189 ++rnk)
190 rank_table[rank_to_char_table[rnk]] = rnk;
191
192 return rank_table;
193 }()};
194
198 static constexpr std::array<int8_t, SIZE> interaction_tab{
199 []() constexpr
200 {
201 static_assert(static_cast<int16_t>(std::numeric_limits<int8_t>::max()) >= SIZE);
202 static_assert(-static_cast<int16_t>(std::numeric_limits<int8_t>::min()) >= SIZE);
203
204 std::array<int8_t, alphabet_size> interaction_table{};
205 int8_t cnt_open = 0;
206 int8_t cnt_close = 0;
207
208 for (rank_type rnk = 0u; rnk <= 6u; ++rnk)
209 interaction_table[rnk] = 0;
210
211 for (rank_type rnk = 7u; rnk <= 10u; ++rnk)
212 interaction_table[rnk] = --cnt_open;
213
214 for (rank_type rnk = 11u; rnk <= 14u; ++rnk)
215 interaction_table[rnk] = ++cnt_close;
216
217 for (rank_type rnk = 15u; rnk + 1u < alphabet_size; rnk += 2u)
218 {
219 interaction_table[rnk] = --cnt_open;
220 interaction_table[rnk + 1u] = ++cnt_close;
221 }
222
223 return interaction_table;
224 }()};
225};
226
231
232inline namespace literals
233{
234
248constexpr wuss51 operator""_wuss51(char const ch) noexcept
249{
250 return wuss51{}.assign_char(ch);
251}
252
265{
267 vec.resize(len);
268
269 for (size_t idx = 0ul; idx < len; ++idx)
270 vec[idx].assign_char(str[idx]);
271
272 return vec;
273}
275
276} // namespace literals
277
278} // namespace seqan3
Provides seqan3::rna_structure_alphabet.
Provides seqan3::alphabet_base.
A CRTP-base that makes defining a custom alphabet easier.
Definition alphabet_base.hpp:54
constexpr rank_type to_rank() const noexcept
Return the letter's numeric value (rank in the alphabet).
Definition alphabet_base.hpp:134
detail::min_viable_uint_t< size - 1 > rank_type
The type of the alphabet when represented as a number (e.g. via to_rank()).
Definition alphabet_base.hpp:77
static constexpr detail::min_viable_uint_t< size > alphabet_size
The size of the alphabet, i.e. the number of different values it can take.
Definition alphabet_base.hpp:196
constexpr char_type to_char() const noexcept
Return the letter as a character of char_type.
Definition alphabet_base.hpp:112
std::conditional_t< std::same_as< char_t, void >, char, char_t > char_type
The char representation; conditional needed to make semi alphabet definitions legal.
Definition alphabet_base.hpp:69
A "pretty printer" for most SeqAn data structures and related types.
Definition debug_stream_type.hpp:79
The WUSS structure alphabet of the characters .<>:,-_~;()[]{}AaBbCcDd...
Definition wuss.hpp:58
static constexpr uint8_t max_pseudoknot_depth
The ability of this alphabet to represent pseudoknots, i.e. crossing interactions,...
Definition wuss.hpp:129
constexpr bool is_pair_close() const noexcept
Check whether the character represents a leftward interaction in an RNA structure.
Definition wuss.hpp:108
constexpr bool is_pair_open() const noexcept
Check whether the character represents a rightward interaction in an RNA structure.
Definition wuss.hpp:98
constexpr std::optional< uint8_t > pseudoknot_id() const noexcept
Get an identifier for a pseudoknotted interaction, where opening and closing brackets of the same typ...
Definition wuss.hpp:139
detail::min_viable_uint_t< size - 1 > rank_type
The type of the alphabet when represented as a number (e.g. via to_rank()).
Definition alphabet_base.hpp:77
static constexpr detail::min_viable_uint_t< size > alphabet_size
The size of the alphabet, i.e. the number of different values it can take.
Definition alphabet_base.hpp:196
constexpr wuss() noexcept=default
Defaulted.
constexpr bool is_unpaired() const noexcept
Check whether the character represents an unpaired position in an RNA structure.
Definition wuss.hpp:118
std::conditional_t< std::same_as< char_t, void >, char, char_t > char_type
The char representation; conditional needed to make semi alphabet definitions legal.
Definition alphabet_base.hpp:69
T fill(T... args)
constexpr auto to_rank
Return the rank representation of a (semi-)alphabet object.
Definition alphabet/concept.hpp:152
T max(T... args)
T min(T... args)
The main SeqAn3 namespace.
Definition aligned_sequence_concept.hpp:26
@ off
Automatic update notifications should be disabled.
#define SEQAN3_WORKAROUND_LITERAL
Our char literals returning std::vector should be constexpr if constexpr std::vector is supported.
Definition platform.hpp:269
Provides utilities for modifying characters.
Hide me