26#include <seqan3/io/detail/record.hpp>
60template <detail::fields_specialisation selected_field_ids_ = fields<
field::seq,
71 detail::type_list_of_sam_file_output_formats valid_formats_ = type_list<format_sam, format_bam>,
72 typename ref_ids_type = ref_info_not_given>
102 "The field::offset is deprecated. It is already stored in the field::cigar as soft clipping (S) "
103 "at the front and not needed otherwise.");
106 "The seqan3::field::alignment was removed from the allowed fields for seqan3::sam_file_output. "
107 "Only seqan3::field::cigar is supported. seqan3::cigar_from_alignment on how to get a CIGAR string "
108 "from an alignment.");
113 for (
field f : selected_field_ids::as_array)
114 if (!field_ids::contains(f))
118 "You selected a field that is not valid for SAM files, "
119 "please refer to the documentation of "
120 "seqan3::sam_file_output::field_ids for the accepted values.");
138 using iterator = detail::out_file_iterator<sam_file_output>;
161 if (header_has_been_written)
164 assert(!format.valueless_by_exception());
169 if constexpr (std::same_as<ref_ids_type, ref_info_not_given>)
170 f.write_header(*secondary_stream,
options, std::ignore);
172 f.write_header(*secondary_stream,
options, *header_ptr);
206 primary_stream->rdbuf()->pubsetbuf(stream_buffer.
data(), stream_buffer.
size());
208 ->open(filename, std::ios_base::out | std::ios::binary);
211 if (!primary_stream->good())
212 throw file_open_error{
"Could not open file " + filename.
string() +
" for writing."};
215 secondary_stream = detail::make_secondary_ostream(*primary_stream, filename);
218 detail::set_format(format, filename);
237 template <output_stream stream_type, sam_file_output_format file_format>
238 requires std::same_as<typename std::remove_reference_t<stream_type>::char_type,
stream_char_type>
240 file_format
const & SEQAN3_DOXYGEN_ONLY(format_tag),
242 primary_stream{&stream, stream_deleter_noop},
243 secondary_stream{&stream, stream_deleter_noop},
244 format{detail::sam_file_output_format_exposer<file_format>{}}
246 static_assert(list_traits::contains<file_format, valid_formats>,
247 "You selected a format that is not in the valid_formats of this file.");
251 template <output_stream stream_type, sam_file_output_format file_format>
252 requires std::same_as<typename std::remove_reference_t<stream_type>::char_type,
stream_char_type>
254 file_format
const & SEQAN3_DOXYGEN_ONLY(format_tag),
256 primary_stream{
new stream_type{std::move(stream)}, stream_deleter_default},
257 secondary_stream{&*primary_stream, stream_deleter_noop},
258 format{detail::sam_file_output_format_exposer<file_format>{}}
260 static_assert(list_traits::contains<file_format, valid_formats>,
261 "You selected a format that is not in the valid_formats of this file.");
294 template <
typename ref_
ids_type_, std::ranges::forward_range ref_lengths_type>
295 requires std::same_as<std::remove_reference_t<ref_ids_type_>, ref_ids_type>
297 ref_ids_type_ && ref_ids,
298 ref_lengths_type && ref_lengths,
303 initialise_header_information(std::forward<ref_ids_type_>(ref_ids),
304 std::forward<ref_lengths_type>(ref_lengths));
328 template <output_stream stream_type,
329 sam_file_output_format file_format,
330 typename ref_ids_type_,
331 std::ranges::forward_range ref_lengths_type>
332 requires std::same_as<std::remove_reference_t<ref_ids_type_>, ref_ids_type>
334 ref_ids_type_ && ref_ids,
335 ref_lengths_type && ref_lengths,
336 file_format
const & SEQAN3_DOXYGEN_ONLY(format_tag),
340 initialise_header_information(std::forward<ref_ids_type_>(ref_ids),
341 std::forward<ref_lengths_type>(ref_lengths));
408 template <
typename record_t>
410 requires detail::record_like<record_t>
414 write_record(detail::get_or<field::header_ptr>(r,
nullptr),
419 detail::get_or<field::ref_id>(r, std::ignore),
423 detail::get_or<field::mapq>(r, 0u),
424 detail::get_or<field::mate>(r, default_mate_t{}),
426 detail::get_or<field::evalue>(r, 0u),
427 detail::get_or<field::bit_score>(r, 0u));
451 template <
typename tuple_t>
458 write_record(detail::get_or<selected_field_ids::index_of(
field::header_ptr)>(t,
nullptr),
463 detail::get_or<selected_field_ids::index_of(
field::ref_id)>(t, std::ignore),
467 detail::get_or<selected_field_ids::index_of(
field::mapq)>(t, 0u),
468 detail::get_or<selected_field_ids::index_of(
field::mate)>(t, default_mate_t{}),
470 detail::get_or<selected_field_ids::index_of(
field::evalue)>(t, 0u),
497 template <
typename arg_t,
typename... arg_types>
498 requires (
sizeof...(arg_types) + 1 <= selected_field_ids::size)
525 template <
typename rng_t>
529 for (
auto &&
record : range)
562 template <
typename rng_t>
571 template <
typename rng_t>
588 return *secondary_stream;
604 if constexpr (std::same_as<ref_ids_type, ref_info_not_given>)
605 throw std::logic_error{
"Please construct your file with reference id and length information in order "
606 "to properly initialise the header before accessing it."};
614 bool header_has_been_written{
false};
635 stream_ptr_t primary_stream{
nullptr, stream_deleter_noop};
637 stream_ptr_t secondary_stream{
nullptr, stream_deleter_noop};
640 using format_type =
typename detail::variant_from_tags<valid_formats, detail::sam_file_output_format_exposer>::type;
647 using header_type = sam_file_header<
654 template <
typename ref_
ids_type_,
typename ref_lengths_type>
655 void initialise_header_information(ref_ids_type_ && ref_ids, ref_lengths_type && ref_lengths)
657 assert(std::ranges::size(ref_ids) == std::ranges::size(ref_lengths));
659 header_ptr = std::make_unique<sam_file_header<ref_ids_type>>(std::forward<ref_ids_type_>(ref_ids));
661 for (int32_t idx = 0; idx < std::ranges::distance(
header_ptr->ref_ids()); ++idx)
663 header_ptr->ref_id_info.emplace_back(ref_lengths[idx],
"");
665 if constexpr (std::ranges::contiguous_range<std::ranges::range_reference_t<ref_ids_type_>>
666 && std::ranges::sized_range<std::ranges::range_reference_t<ref_ids_type_>>
667 && std::ranges::borrowed_range<std::ranges::range_reference_t<ref_ids_type_>>)
680 template <
typename record_header_ptr_t,
typename... pack_type>
681 void write_record(record_header_ptr_t && record_header_ptr, pack_type &&... remainder)
683 static_assert((
sizeof...(pack_type) == 13),
"Wrong parameter list passed to write_record.");
685 assert(!
format.valueless_by_exception());
691 if constexpr (!std::same_as<record_header_ptr_t, std::nullptr_t>)
693 f.write_alignment_record(*secondary_stream,
696 std::forward<pack_type>(remainder)...);
698 else if constexpr (std::same_as<ref_ids_type, ref_info_not_given>)
700 f.write_alignment_record(*secondary_stream,
703 std::forward<pack_type>(remainder)...);
707 f.write_alignment_record(*secondary_stream,
710 std::forward<pack_type>(remainder)...);
715 header_has_been_written =
true;
730template <detail::fields_specialisation selected_field_
ids>
737template <output_stream stream_type,
746template <output_stream stream_type,
755template <output_stream stream_type, sam_file_output_format file_format>
762template <output_stream stream_type, sam_file_output_format file_format>
768 std::ranges::forward_range ref_ids_type,
769 std::ranges::forward_range ref_lengths_type>
776template <std::ranges::forward_range ref_
ids_type, std::ranges::forward_range ref_lengths_type>
783template <output_stream stream_type,
784 std::ranges::forward_range ref_ids_type,
785 std::ranges::forward_range ref_lengths_type,
792template <output_stream stream_type,
793 std::ranges::forward_range ref_ids_type,
794 std::ranges::forward_range ref_lengths_type,
801template <output_stream stream_type,
802 std::ranges::forward_range ref_ids_type,
803 std::ranges::forward_range ref_lengths_type,
805sam_file_output(stream_type &&, ref_ids_type &&, ref_lengths_type &&, file_format
const &)
811template <output_stream stream_type,
812 std::ranges::forward_range ref_ids_type,
813 std::ranges::forward_range ref_lengths_type,
815sam_file_output(stream_type &, ref_ids_type &&, ref_lengths_type &&, file_format
const &)
A class for writing SAM files; both SAM and its binary representation BAM are supported.
Definition: io/sam_file/output.hpp:74
sam_file_output(stream_type &, ref_ids_type &&, ref_lengths_type &&, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces the valid format and the ref_ids_type from input. selected_field_ids is set to the default.
void const_reference
The const reference type (void).
Definition: io/sam_file/output.hpp:132
friend sam_file_output operator|(rng_t &&range, sam_file_output &&f)
This is an overloaded member function, provided for convenience. It differs from the above function only in what argument(s) it accepts.
Definition: io/sam_file/output.hpp:572
sam_file_output(stream_type &, ref_ids_type &&, ref_lengths_type &&, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces selected_field_ids, the valid format, and the ref_ids_type from input.
sam_file_output(std::filesystem::path const &, ref_ids_type &&, ref_lengths_type &&) -> sam_file_output< typename sam_file_output<>::selected_field_ids, typename sam_file_output<>::valid_formats, std::remove_reference_t< ref_ids_type > >
Deduces ref_ids_type from input. Valid formats, and selected_field_ids are set to the default.
void size_type
The size type (void).
Definition: io/sam_file/output.hpp:134
sam_file_output & operator=(rng_t &&range)
Write a range of records (or tuples) to the file.
Definition: io/sam_file/output.hpp:526
sam_file_output(sam_file_output const &)=delete
Copy construction is explicitly deleted, because you can't have multiple access to the same file.
sam_file_output()=delete
Default constructor is explicitly deleted, you need to give a stream or file name.
detail::out_file_iterator< sam_file_output > iterator
The iterator type of this view (an output iterator).
Definition: io/sam_file/output.hpp:138
friend sam_file_output & operator|(rng_t &&range, sam_file_output &f)
Write a range of records (or tuples) to the file.
Definition: io/sam_file/output.hpp:563
void emplace_back(arg_t &&arg, arg_types &&... args)
Write a record to the file by passing individual fields.
Definition: io/sam_file/output.hpp:499
std::default_sentinel_t sentinel
The type returned by end().
Definition: io/sam_file/output.hpp:142
char stream_char_type
Character type of the stream(s).
Definition: io/sam_file/output.hpp:85
iterator begin() noexcept
Returns an iterator to current position in the file.
Definition: io/sam_file/output.hpp:366
sentinel end() noexcept
Returns a sentinel for comparison with iterator.
Definition: io/sam_file/output.hpp:385
sam_file_output(std::filesystem::path const &filename, ref_ids_type_ &&ref_ids, ref_lengths_type &&ref_lengths, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from filename.
Definition: io/sam_file/output.hpp:296
~sam_file_output()
The destructor will write the header if it has not been written before.
Definition: io/sam_file/output.hpp:159
sam_file_output(std::filesystem::path, selected_field_ids const &) -> sam_file_output< selected_field_ids, typename sam_file_output<>::valid_formats, ref_info_not_given >
Deduces selected_field_ids from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(stream_type &&, ref_ids_type &&, ref_lengths_type &&, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces the valid format and the ref_ids_type from input. selected_field_ids is set to the default.
sam_file_output & operator=(sam_file_output &&)=default
Move assignment is defaulted.
selected_field_ids_ selected_field_ids
A seqan3::fields list with the fields selected for the record.
Definition: io/sam_file/output.hpp:81
valid_formats_ valid_formats
A seqan3::type_list with the possible formats.
Definition: io/sam_file/output.hpp:83
sam_file_output & operator=(sam_file_output const &)=delete
Copy assignment is explicitly deleted, because you can't have multiple access to the same file.
sam_file_output(stream_type &&, ref_ids_type &&, ref_lengths_type &&, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces selected_field_ids, the valid format, and the ref_ids_type from input.
void reference
The reference type (void).
Definition: io/sam_file/output.hpp:130
sam_file_output(stream_type &stream, file_format const &format_tag, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from an existing stream and with specified format.
Definition: io/sam_file/output.hpp:239
void push_back(record_t &&r)
Write a seqan3::record to the file.
Definition: io/sam_file/output.hpp:409
sam_file_output(stream_type &&, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(std::filesystem::path filename, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from filename.
Definition: io/sam_file/output.hpp:202
sam_file_output(stream_type &&stream, ref_ids_type_ &&ref_ids, ref_lengths_type &&ref_lengths, file_format const &format_tag, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from an existing stream and with specified format.
Definition: io/sam_file/output.hpp:333
void value_type
The value type (void).
Definition: io/sam_file/output.hpp:128
sam_file_output_options options
The options are public and its members can be set directly.
Definition: io/sam_file/output.hpp:581
sam_file_output(sam_file_output &&)=default
Move construction is defaulted.
sam_file_output(stream_type &&stream, file_format const &format_tag, selected_field_ids const &fields_tag=selected_field_ids{})
This is an overloaded member function, provided for convenience. It differs from the above function only in what argument(s) it accepts.
Definition: io/sam_file/output.hpp:253
sam_file_output(stream_type &, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces selected_field_ids and the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(stream_type &&, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces selected_field_ids and the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
void push_back(tuple_t &&t)
Write a record in form of a std::tuple to the file.
Definition: io/sam_file/output.hpp:452
auto & header()
Access the file's header.
Definition: io/sam_file/output.hpp:602
sam_file_output(std::filesystem::path const &, ref_ids_type &&, ref_lengths_type &&, selected_field_ids const &) -> sam_file_output< selected_field_ids, typename sam_file_output<>::valid_formats, std::remove_reference_t< ref_ids_type > >
Deduces selected_field_ids and ref_ids_type from input. valid_formats is set to the default.
void const_iterator
The const iterator type is void, because files are not const-iterable.
Definition: io/sam_file/output.hpp:140
sam_file_output(stream_type &, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
The SAM tag dictionary class that stores all optional SAM fields.
Definition: sam_tag_dictionary.hpp:343
@ none
None of the flags below are set.
field
An enumerator for the fields used in file formats.
Definition: record.hpp:63
@ flag
The alignment flag (bit information), uint16_t value.
@ ref_offset
Sequence (seqan3::field::ref_seq) relative start position (0-based), unsigned value.
@ ref_seq
The (reference) "sequence" information, usually a range of nucleotides or amino acids.
@ alignment
The (pairwise) alignment stored in an object that models seqan3::detail::pairwise_alignment.
@ cigar
The cigar vector (std::vector<seqan3::cigar>) representing the alignment in SAM/BAM format.
@ mapq
The mapping quality of the seqan3::field::seq alignment, usually a Phred-scaled score.
@ bit_score
The bit score (statistical significance indicator), unsigned value.
@ offset
Sequence (seqan3::field::seq) relative start position (0-based), unsigned value.
@ mate
The mate pair information given as a std::tuple of reference name, offset and template length.
@ header_ptr
A pointer to the seqan3::sam_file_header object storing header information.
@ ref_id
The identifier of the (reference) sequence that seqan3::field::seq was aligned to.
@ evalue
The e-value (length normalized bit score), double value.
@ id
The identifier, usually a string.
@ tags
The optional tags in the SAM format, stored in a dictionary.
@ seq
The "sequence", usually a range of nucleotides or amino acids.
@ qual
The qualities, usually in Phred score notation.
Whether a type behaves like a tuple.
Provides exceptions used in the I/O module.
Provides various utility functions required only for output.
The main SeqAn3 namespace.
Definition: aligned_sequence_concept.hpp:29
Provides the seqan3::detail::out_file_iterator class template.
Provides the seqan3::record template and the seqan3::field enum.
Provides seqan3::detail::record_like.
Provides seqan3::sam_file_output_options.
Provides helper data structures for the seqan3::sam_file_output.
A class template that holds a choice of seqan3::field.
Definition: record.hpp:128
The class template that file records are based on; behaves like a std::tuple.
Definition: record.hpp:193
Type tag which indicates that no reference information has been passed to the SAM file on construction.
Definition: sam_flag.hpp:24
The options type defines various option members that influence the behavior of all or some formats.
Definition: sam_file/output_options.hpp:26
Type that contains multiple types.
Definition: type_list.hpp:29
Provides traits for seqan3::type_list.
Provides seqan3::tuple_like.