26#include <seqan3/io/detail/record.hpp>
144template <detail::fields_specialisation selected_field_ids_ =
158 detail::type_list_of_sam_file_output_formats valid_formats_ = type_list<format_sam, format_bam>,
159 typename ref_ids_type = ref_info_not_given>
190 static_assert([] ()
constexpr
192 for (
field f : selected_field_ids::as_array)
193 if (!field_ids::contains(f))
197 "You selected a field that is not valid for alignment files, "
198 "please refer to the documentation of "
199 "seqan3::sam_file_output::field_ids for the accepted values.");
217 using iterator = detail::out_file_iterator<sam_file_output>;
269 primary_stream->rdbuf()->pubsetbuf(stream_buffer.data(), stream_buffer.size());
271 std::ios_base::out | std::ios::binary);
274 if (!primary_stream->good())
275 throw file_open_error{
"Could not open file " + filename.
string() +
" for writing."};
278 secondary_stream = detail::make_secondary_ostream(*primary_stream, filename);
281 detail::set_format(format, filename);
300 template <output_stream stream_type, sam_file_output_format file_format>
302 requires std::same_as<typename std::remove_reference_t<stream_type>::char_type,
stream_char_type>
305 file_format
const & SEQAN3_DOXYGEN_ONLY(format_tag),
307 primary_stream{&stream, stream_deleter_noop},
308 secondary_stream{&stream, stream_deleter_noop},
309 format{detail::sam_file_output_format_exposer<file_format>{}}
311 static_assert(list_traits::contains<file_format, valid_formats>,
312 "You selected a format that is not in the valid_formats of this file.");
316 template <output_stream stream_type, sam_file_output_format file_format>
318 requires std::same_as<typename std::remove_reference_t<stream_type>::char_type,
stream_char_type>
321 file_format
const & SEQAN3_DOXYGEN_ONLY(format_tag),
323 primary_stream{
new stream_type{std::move(stream)}, stream_deleter_default},
324 secondary_stream{&*primary_stream, stream_deleter_noop},
325 format{detail::sam_file_output_format_exposer<file_format>{}}
327 static_assert(list_traits::contains<file_format, valid_formats>,
328 "You selected a format that is not in the valid_formats of this file.");
361 template <
typename ref_
ids_type_, std::ranges::forward_range ref_lengths_type>
363 requires std::same_as<std::remove_reference_t<ref_ids_type_>, ref_ids_type>
366 ref_ids_type_ && ref_ids,
367 ref_lengths_type && ref_lengths,
372 initialise_header_information(ref_ids, ref_lengths);
396 template <output_stream stream_type,
398 typename ref_ids_type_,
399 std::ranges::forward_range ref_lengths_type>
401 requires std::same_as<std::remove_reference_t<ref_ids_type_>, ref_ids_type>
404 ref_ids_type_ && ref_ids,
405 ref_lengths_type && ref_lengths,
406 file_format
const & SEQAN3_DOXYGEN_ONLY(format_tag),
410 initialise_header_information(ref_ids, ref_lengths);
477 template <
typename record_t>
480 requires detail::record_like<record_t>
486 write_record(detail::get_or<field::header_ptr>(r,
nullptr),
490 detail::get_or<field::offset>(r, 0u),
492 detail::get_or<field::ref_id>(r, std::ignore),
494 detail::get_or<field::alignment>(r, default_align_t{}),
497 detail::get_or<field::mapq>(r, 0u),
498 detail::get_or<field::mate>(r, default_mate_t{}),
500 detail::get_or<field::evalue>(r, 0u),
501 detail::get_or<field::bit_score>(r, 0u));
525 template <
typename tuple_t>
535 write_record(detail::get_or<selected_field_ids::index_of(
field::header_ptr)>(t,
nullptr),
539 detail::get_or<selected_field_ids::index_of(
field::offset)>(t, 0u),
541 detail::get_or<selected_field_ids::index_of(
field::ref_id)>(t, std::ignore),
543 detail::get_or<selected_field_ids::index_of(
field::alignment)>(t, default_align_t{}),
546 detail::get_or<selected_field_ids::index_of(
field::mapq)>(t, 0u),
547 detail::get_or<selected_field_ids::index_of(
field::mate)>(t, default_mate_t{}),
549 detail::get_or<selected_field_ids::index_of(
field::evalue)>(t, 0u),
576 template <
typename arg_t,
typename ...arg_types>
606 template <
typename rng_t>
612 for (
auto &&
record : range)
645 template <
typename rng_t>
656 template <
typename rng_t>
675 return *secondary_stream;
691 if constexpr (std::same_as<ref_ids_type, ref_info_not_given>)
692 throw std::logic_error{
"Please construct your file with reference id and length information in order "
693 "to properly initialise the header before accessing it."};
715 stream_ptr_t primary_stream{
nullptr, stream_deleter_noop};
717 stream_ptr_t secondary_stream{
nullptr, stream_deleter_noop};
720 using format_type =
typename detail::variant_from_tags<
valid_formats,
721 detail::sam_file_output_format_exposer>::type;
728 using header_type = sam_file_header<std::conditional_t<std::same_as<ref_ids_type, ref_info_not_given>,
736 template <
typename ref_
ids_type_,
typename ref_lengths_type>
737 void initialise_header_information(ref_ids_type_ && ref_ids, ref_lengths_type && ref_lengths)
741 header_ptr = std::make_unique<sam_file_header<ref_ids_type>>(std::forward<ref_ids_type_>(ref_ids));
743 for (int32_t idx = 0; idx < std::ranges::distance(ref_ids); ++idx)
745 header_ptr->ref_id_info.emplace_back(ref_lengths[idx],
"");
747 if constexpr (std::ranges::contiguous_range<std::ranges::range_reference_t<ref_ids_type_>> &&
748 std::ranges::sized_range<std::ranges::range_reference_t<ref_ids_type_>> &&
749 std::ranges::borrowed_range<std::ranges::range_reference_t<ref_ids_type_>>)
762 template <
typename record_header_ptr_t,
typename ...pack_type>
763 void write_record(record_header_ptr_t && record_header_ptr, pack_type && ...remainder)
765 static_assert((
sizeof...(pack_type) == 15),
"Wrong parameter list passed to write_record.");
767 assert(!
format.valueless_by_exception());
772 if constexpr (!std::same_as<record_header_ptr_t, std::nullptr_t>)
774 f.write_alignment_record(*secondary_stream,
777 std::forward<pack_type>(remainder)...);
779 else if constexpr (std::same_as<ref_ids_type, ref_info_not_given>)
781 f.write_alignment_record(*secondary_stream,
784 std::forward<pack_type>(remainder)...);
788 f.write_alignment_record(*secondary_stream,
791 std::forward<pack_type>(remainder)...);
808template <detail::fields_specialisation selected_field_
ids>
815template <output_stream stream_type,
824template <output_stream stream_type,
833template <output_stream stream_type,
841template <output_stream stream_type,
848 std::ranges::forward_range ref_ids_type,
849 std::ranges::forward_range ref_lengths_type>
856template <std::ranges::forward_range ref_ids_type,
857 std::ranges::forward_range ref_lengths_type>
864template <output_stream stream_type,
865 std::ranges::forward_range ref_ids_type,
866 std::ranges::forward_range ref_lengths_type,
873template <output_stream stream_type,
874 std::ranges::forward_range ref_ids_type,
875 std::ranges::forward_range ref_lengths_type,
882template <output_stream stream_type,
883 std::ranges::forward_range ref_ids_type,
884 std::ranges::forward_range ref_lengths_type,
886sam_file_output(stream_type &&, ref_ids_type &&, ref_lengths_type &&, file_format
const &)
892template <output_stream stream_type,
893 std::ranges::forward_range ref_ids_type,
894 std::ranges::forward_range ref_lengths_type,
896sam_file_output(stream_type &, ref_ids_type &&, ref_lengths_type &&, file_format
const &)
A class for writing alignment files, e.g. SAM, BAM, BLAST, ...
Definition: output.hpp:161
sam_file_output(stream_type &, ref_ids_type &&, ref_lengths_type &&, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces the valid format, and the ref_ids_type from input. selected_field_ids set to the default.
void const_reference
The const reference type (void).
Definition: output.hpp:211
sam_file_output(stream_type &&stream, ref_ids_type_ &&ref_ids, ref_lengths_type &&ref_lengths, file_format const &format_tag, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from an existing stream and with specified format.
Definition: output.hpp:403
sam_file_output(stream_type &, ref_ids_type &&, ref_lengths_type &&, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces selected_field_ids, the valid format, and the ref_ids_type from input.
sam_file_output(std::filesystem::path const &, ref_ids_type &&, ref_lengths_type &&) -> sam_file_output< typename sam_file_output<>::selected_field_ids, typename sam_file_output<>::valid_formats, std::remove_reference_t< ref_ids_type > >
Deduces ref_ids_type from input. Valid formats, and selected_field_ids are set to the default.
void size_type
The size type (void).
Definition: output.hpp:213
friend sam_file_output & operator|(rng_t &&range, sam_file_output &f)
Write a range of records (or tuples) to the file.
Definition: output.hpp:646
sam_file_output(stream_type &&stream, file_format const &format_tag, selected_field_ids const &fields_tag=selected_field_ids{})
This is an overloaded member function, provided for convenience. It differs from the above function only in what argument(s) it accepts.
Definition: output.hpp:320
sam_file_output(sam_file_output const &)=delete
Copy construction is explicitly deleted, because you can't have multiple access to the same file.
sam_file_output()=delete
Default constructor is explicitly deleted, you need to give a stream or file name.
sam_file_output & operator=(rng_t &&range)
Write a range of records (or tuples) to the file.
Definition: output.hpp:607
detail::out_file_iterator< sam_file_output > iterator
The iterator type of this view (an output iterator).
Definition: output.hpp:217
std::default_sentinel_t sentinel
The type returned by end().
Definition: output.hpp:221
char stream_char_type
Character type of the stream(s).
Definition: output.hpp:172
sam_file_output(stream_type &stream, file_format const &format_tag, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from an existing stream and with specified format.
Definition: output.hpp:304
iterator begin() noexcept
Returns an iterator to current position in the file.
Definition: output.hpp:435
sentinel end() noexcept
Returns a sentinel for comparison with iterator.
Definition: output.hpp:454
sam_file_output(std::filesystem::path, selected_field_ids const &) -> sam_file_output< selected_field_ids, typename sam_file_output<>::valid_formats, ref_info_not_given >
Deduces selected_field_ids from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(stream_type &&, ref_ids_type &&, ref_lengths_type &&, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces the valid format, and the ref_ids_type from input. selected_field_ids set to the default.
void emplace_back(arg_t &&arg, arg_types &&... args)
Write a record to the file by passing individual fields.
Definition: output.hpp:580
void push_back(record_t &&r)
Write a seqan3::record to the file.
Definition: output.hpp:478
sam_file_output & operator=(sam_file_output &&)=default
Move assignment is defaulted.
selected_field_ids_ selected_field_ids
A seqan3::fields list with the fields selected for the record.
Definition: output.hpp:168
valid_formats_ valid_formats
A seqan3::type_list with the possible formats.
Definition: output.hpp:170
sam_file_output & operator=(sam_file_output const &)=delete
Copy assignment is explicitly deleted, because you can't have multiple access to the same file.
sam_file_output(stream_type &&, ref_ids_type &&, ref_lengths_type &&, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, std::remove_reference_t< ref_ids_type > >
Deduces selected_field_ids, the valid format, and the ref_ids_type from input.
void reference
The reference type (void).
Definition: output.hpp:209
sam_file_output(stream_type &&, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(std::filesystem::path filename, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from filename.
Definition: output.hpp:265
void push_back(tuple_t &&t)
Write a record in form of a std::tuple to the file.
Definition: output.hpp:526
void value_type
The value type (void).
Definition: output.hpp:207
~sam_file_output()=default
Destructor is defaulted.
sam_file_output_options options
The options are public and its members can be set directly.
Definition: output.hpp:668
sam_file_output(sam_file_output &&)=default
Move construction is defaulted.
sam_file_output(stream_type &, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces selected_field_ids, and the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(stream_type &&, file_format const &, selected_field_ids const &) -> sam_file_output< selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces selected_field_ids, and the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
sam_file_output(std::filesystem::path const &filename, ref_ids_type_ &&ref_ids, ref_lengths_type &&ref_lengths, selected_field_ids const &fields_tag=selected_field_ids{})
Construct from filename.
Definition: output.hpp:365
auto & header()
Access the file's header.
Definition: output.hpp:689
friend sam_file_output operator|(rng_t &&range, sam_file_output &&f)
This is an overloaded member function, provided for convenience. It differs from the above function only in what argument(s) it accepts.
Definition: output.hpp:657
sam_file_output(std::filesystem::path const &, ref_ids_type &&, ref_lengths_type &&, selected_field_ids const &) -> sam_file_output< selected_field_ids, typename sam_file_output<>::valid_formats, std::remove_reference_t< ref_ids_type > >
Deduces selected_field_ids and ref_ids_type from input. valid_formats is set to the default.
void const_iterator
The const iterator type is void, because files are not const-iterable.
Definition: output.hpp:219
sam_file_output(stream_type &, file_format const &) -> sam_file_output< typename sam_file_output<>::selected_field_ids, type_list< file_format >, ref_info_not_given >
Deduces the valid format from input and sets sam_file_output::ref_ids_type to seqan3::detail::ref_info_not_given.
The SAM tag dictionary class that stores all optional SAM fields.
Definition: sam_tag_dictionary.hpp:334
This header includes C++17 filesystem support and imports it into namespace std::filesystem (independ...
@ none
None of the flags below are set.
field
An enumerator for the fields used in file formats.
Definition: record.hpp:63
@ flag
The alignment flag (bit information), uint16_t value.
@ ref_offset
Sequence (seqan3::field::ref_seq) relative start position (0-based), unsigned value.
@ ref_seq
The (reference) "sequence" information, usually a range of nucleotides or amino acids.
@ alignment
The (pairwise) alignment stored in an object that models seqan3::detail::pairwise_alignment.
@ cigar
The cigar vector (std::vector<seqan3::cigar>) representing the alignment in SAM/BAM format.
@ mapq
The mapping quality of the seqan3::field::seq alignment, usually a Phred-scaled score.
@ bit_score
The bit score (statistical significance indicator), unsigned value.
@ offset
Sequence (seqan3::field::seq) relative start position (0-based), unsigned value.
@ mate
The mate pair information given as a std::tuple of reference name, offset and template length.
@ header_ptr
A pointer to the seqan3::sam_file_header object storing header information.
@ ref_id
The identifier of the (reference) sequence that seqan3::field::seq was aligned to.
@ evalue
The e-value (length-normalized bit score), double value.
@ id
The identifier, usually a string.
@ tags
The optional tags in the SAM format, stored in a dictionary.
@ seq
The "sequence", usually a range of nucleotides or amino acids.
@ qual
The qualities, usually in Phred score notation.
constexpr size_t size
The size of a type pack.
Definition: traits.hpp:151
Whether a type behaves like a tuple.
Provides exceptions used in the I/O module.
Provides various utility functions required only for output.
The main SeqAn3 namespace.
Definition: cigar_operation_table.hpp:2
Provides the seqan3::detail::out_file_iterator class template.
Adaptations of concepts from the Ranges TS.
Provides the seqan3::record template and the seqan3::field enum.
Provides seqan3::detail::record_like.
Provides seqan3::sam_file_output_options.
Provides helper data structures for the seqan3::sam_file_output.
A class template that holds a choice of seqan3::field.
Definition: record.hpp:128
The class template that file records are based on; behaves like an std::tuple.
Definition: record.hpp:191
Type tag which indicates that no reference information has been passed to the alignment file on construction.
Definition: sam_flag.hpp:24
The options type defines various option members that influence the behavior of all or some formats.
Definition: output_options.hpp:23
Type that contains multiple types.
Definition: type_list.hpp:29
Provides traits for seqan3::type_list.
Provides seqan3::tuple_like.