SeqAn3 3.1.0
The Modern C++ library for sequence analysis.
nucleotide_base.hpp
Go to the documentation of this file.
1// -----------------------------------------------------------------------------------------------------
2// Copyright (c) 2006-2021, Knut Reinert & Freie Universität Berlin
3// Copyright (c) 2016-2021, Knut Reinert & MPI für molekulare Genetik
4// This file may be used, modified and/or redistributed under the terms of the 3-clause BSD-License
5// shipped with this file and also available at: https://github.com/seqan/seqan3/blob/master/LICENSE.md
6// -----------------------------------------------------------------------------------------------------
7
13#pragma once
14
16#include <seqan3/alphabet/detail/convert.hpp>
19
20namespace seqan3
21{
22
41template <typename derived_type, auto size>
42class nucleotide_base : public alphabet_base<derived_type, size, char>
43{
44private:
47
51 constexpr nucleotide_base() noexcept = default;
52 constexpr nucleotide_base(nucleotide_base const &) noexcept = default;
53 constexpr nucleotide_base(nucleotide_base &&) noexcept = default;
54 constexpr nucleotide_base & operator=(nucleotide_base const &) noexcept = default;
55 constexpr nucleotide_base & operator=(nucleotide_base &&) noexcept = default;
56 ~nucleotide_base() noexcept = default;
57
59
61 friend derived_type;
62
63protected:
64 // Import from base:
65 using typename base_t::char_type;
66 using typename base_t::rank_type;
67
68public:
70 using base_t::to_rank;
71
75 // This constructor needs to be public, because constructor templates are not inherited otherwise
80 template <typename other_nucl_type>
82 requires (!std::same_as<nucleotide_base, other_nucl_type>) &&
83 (!std::same_as<derived_type, other_nucl_type>) &&
86 explicit constexpr nucleotide_base(other_nucl_type const & other) noexcept
87 {
88 static_cast<derived_type &>(*this) =
89 detail::convert_through_char_representation<derived_type, other_nucl_type>[seqan3::to_rank(other)];
90 }
92
115 constexpr derived_type complement() const noexcept
116 {
117 return derived_type{}.assign_rank(derived_type{}.rank_complement(to_rank()));
118 }
120
142 static constexpr bool char_is_valid(char_type const c) noexcept
143 {
144 return valid_char_table[static_cast<uint8_t>(c)];
145 }
146
147private:
149 static constexpr std::array<bool, 256> valid_char_table
150 {
151 [] () constexpr
152 {
153 // init with false
155
156 // the original valid chars and their lower cases
157 for (size_t rank = 0u; rank < derived_type::alphabet_size; ++rank)
158 {
159 uint8_t c = derived_type::rank_to_char(rank);
160 ret[c] = true;
161 ret[to_lower(c)] = true;
162 }
163
164 // U and T shall be accepted for all
165 ret['U'] = true;
166 ret['T'] = true;
167 ret['u'] = true;
168 ret['t'] = true;
169
170 return ret;
171 }()
172 };
173};
174
175} // namespace seqan3
Provides seqan3::nucleotide_alphabet.
Provides seqan3::alphabet_base.
A CRTP-base that makes defining a custom alphabet easier.
Definition: alphabet_base.hpp:57
constexpr rank_type to_rank() const noexcept
Return the letter's numeric value (rank in the alphabet).
Definition: alphabet_base.hpp:139
detail::min_viable_uint_t< size - 1 > rank_type
The type of the alphabet when represented as a number (e.g. via to_rank()).
Definition: alphabet_base.hpp:80
static constexpr detail::min_viable_uint_t< size > alphabet_size
The size of the alphabet, i.e. the number of different values it can take.
Definition: alphabet_base.hpp:203
std::conditional_t< std::same_as< char, void >, char, char > char_type
The char representation; conditional needed to make semi alphabet definitions legal.
Definition: alphabet_base.hpp:72
A CRTP-base that refines seqan3::alphabet_base and is used by the nucleotides.
Definition: nucleotide_base.hpp:43
static constexpr bool char_is_valid(char_type const c) noexcept
Validate whether a character value has a one-to-one mapping to an alphabet value.
Definition: nucleotide_base.hpp:142
constexpr derived_type complement() const noexcept
Return the complement of the letter.
Definition: nucleotide_base.hpp:115
constexpr nucleotide_base(other_nucl_type const &other) noexcept
Allow explicit construction from any other nucleotide type and convert via the character representati...
Definition: nucleotide_base.hpp:86
constexpr auto alphabet_size
A type trait that holds the size of a (semi-)alphabet.
Definition: concept.hpp:861
constexpr auto to_rank
Return the rank representation of a (semi-)alphabet object.
Definition: concept.hpp:155
A concept that indicates whether an alphabet represents nucleotides.
The main SeqAn3 namespace.
Definition: cigar_operation_table.hpp:2
constexpr char_type to_lower(char_type const c) noexcept
Converts 'A'-'Z' to 'a'-'z' respectively; other characters are returned as is.
Definition: transform.hpp:81
Provides utilities for modifying characters.