SeqAn3  3.0.3
The Modern C++ library for sequence analysis.
nucleotide_base.hpp
Go to the documentation of this file.
1 // -----------------------------------------------------------------------------------------------------
2 // Copyright (c) 2006-2020, Knut Reinert & Freie Universität Berlin
3 // Copyright (c) 2016-2020, Knut Reinert & MPI für molekulare Genetik
4 // This file may be used, modified and/or redistributed under the terms of the 3-clause BSD-License
5 // shipped with this file and also available at: https://github.com/seqan/seqan3/blob/master/LICENSE.md
6 // -----------------------------------------------------------------------------------------------------
7 
13 #pragma once
14 
19 
20 namespace seqan3
21 {
22 
41 template <typename derived_type, auto size>
42 class nucleotide_base : public alphabet_base<derived_type, size, char>
43 {
44 private:
47 
51  constexpr nucleotide_base() noexcept = default;
52  constexpr nucleotide_base(nucleotide_base const &) noexcept = default;
53  constexpr nucleotide_base(nucleotide_base &&) noexcept = default;
54  constexpr nucleotide_base & operator=(nucleotide_base const &) noexcept = default;
55  constexpr nucleotide_base & operator=(nucleotide_base &&) noexcept = default;
56  ~nucleotide_base() noexcept = default;
57 
59 
61  friend derived_type;
62 
63 protected:
64  // Import from base:
65  using typename base_t::char_type;
66  using typename base_t::rank_type;
67 
68 public:
69  using base_t::alphabet_size;
70  using base_t::to_rank;
71 
75  // This constructor needs to be public, because constructor templates are not inherited otherwise
80  template <typename other_nucl_type>
82  requires (!std::same_as<nucleotide_base, other_nucl_type>) &&
83  (!std::same_as<derived_type, other_nucl_type>) &&
84  nucleotide_alphabet<other_nucl_type>
86  explicit constexpr nucleotide_base(other_nucl_type const & other) noexcept
87  {
88  static_cast<derived_type &>(*this) =
89  detail::convert_through_char_representation<derived_type, other_nucl_type>[seqan3::to_rank(other)];
90  }
92 
115  constexpr derived_type complement() const noexcept
116  {
117  return derived_type::complement_table[to_rank()];
118  }
120 
142  static constexpr bool char_is_valid(char_type const c) noexcept
143  {
144  return valid_char_table[static_cast<uint8_t>(c)];
145  }
146 
147 private:
150  {
151  [] () constexpr
152  {
153  // init with false
154  std::array<bool, 256> ret{};
155 
156  // the original valid chars and their lower cases
157  for (size_t rank = 0u; rank < derived_type::alphabet_size; ++rank)
158  {
159  uint8_t c{};
160 #ifdef SEQAN3_DEPRECATED_310
161  if constexpr (detail::has_rank_to_char_table<derived_type>)
162  c = derived_type::rank_to_char[rank];
163  else
164  c = derived_type::rank_to_char(rank);
165 #else // ^^^ before 3.1.0 release / after 3.1.0 release vvv
166  c = derived_type::rank_to_char(rank);
167 #endif // SEQAN3_DEPRECATED_310
168  ret[c] = true;
169  ret[to_lower(c)] = true;
170  }
171 
172  // U and T shall be accepted for all
173  ret['U'] = true;
174  ret['T'] = true;
175  ret['u'] = true;
176  ret['t'] = true;
177 
178  return ret;
179  }()
180  };
181 };
182 
183 } // namespace seqan3
Provides seqan3::detail::convert_through_char_representation.
Provides seqan3::nucleotide_alphabet.
Provides seqan3::alphabet_base.
A CRTP-base that makes defining a custom alphabet easier.
Definition: alphabet_base.hpp:81
constexpr rank_type to_rank() const noexcept
Return the letter's numeric value (rank in the alphabet).
Definition: alphabet_base.hpp:185
static constexpr detail::min_viable_uint_t< size > alphabet_size
The size of the alphabet, i.e. the number of different values it can take.
Definition: alphabet_base.hpp:276
rank_type rank
The value of the alphabet letter is stored as the rank.
Definition: alphabet_base.hpp:338
A CRTP-base that refines seqan3::alphabet_base and is used by the nucleotides.
Definition: nucleotide_base.hpp:43
static constexpr std::array< bool, 256 > valid_char_table
Implementation of char_is_valid().
Definition: nucleotide_base.hpp:150
friend derived_type
Befriend the derived_type so it can instantiate.
Definition: nucleotide_base.hpp:61
static constexpr bool char_is_valid(char_type const c) noexcept
Validate whether a character value has a one-to-one mapping to an alphabet value.
Definition: nucleotide_base.hpp:142
constexpr nucleotide_base() noexcept=default
Defaulted.
constexpr derived_type complement() const noexcept
Return the complement of the letter.
Definition: nucleotide_base.hpp:115
constexpr auto alphabet_size
A type trait that holds the size of a (semi-)alphabet.
Definition: concept.hpp:858
constexpr auto to_rank
Return the rank representation of a (semi-)alphabet object.
Definition: concept.hpp:155
A concept that indicates whether an alphabet represents nucleotides.
The main SeqAn3 namespace.
Definition: aligned_sequence_concept.hpp:29
constexpr char_type to_lower(char_type const c) noexcept
Converts 'A'-'Z' to 'a'-'z' respectively; other characters are returned as is.
Definition: transform.hpp:81
SeqAn specific customisations in the standard namespace.
Provides utilities for modifying characters.