1// -----------------------------------------------------------------------------------------------------
2// Copyright (c) 2006-2022, Knut Reinert & Freie Universität Berlin
3// Copyright (c) 2016-2022, Knut Reinert & MPI für molekulare Genetik
4// This file may be used, modified and/or redistributed under the terms of the 3-clause BSD-License
5// shipped with this file and also available at:
6// -----------------------------------------------------------------------------------------------------
13#pragma once
15#include <cassert>
16#include <filesystem>
17#include <fstream>
18#include <optional>
19#include <ranges>
20#include <string>
21#include <type_traits>
22#include <variant>
23#include <vector>
27#include <seqan3/io/detail/record.hpp>
30#include <seqan3/io/record.hpp>
41namespace seqan3
44// ----------------------------------------------------------------------------
45// structure_file_output
46// ----------------------------------------------------------------------------
60template <detail::fields_specialisation selected_field_ids_ = fields<field::seq, field::id, field::structure>,
61 detail::type_list_of_structure_file_output_formats valid_formats_ = type_list<format_vienna>>
//!\brief The first template argument (the selected fields), re-exported as a member type.
70 using selected_field_ids = selected_field_ids_;
//!\brief The second template argument (the accepted formats), re-exported as a member type.
72 using valid_formats = valid_formats_;
//!\brief Character type of the underlying stream; fixed to `char`.
74 using stream_char_type = char;
89 static_assert(
90 []() constexpr {
91 for (field f : selected_field_ids::as_array)
92 if (!field_ids::contains(f))
93 return false;
94 return true;
95 }(),
96 "You selected a field that is not valid for structure files, please refer to the documentation "
97 "of structure_file_output::field_ids for the accepted values.");
99 static_assert(
100 []() constexpr {
101 return !(selected_field_ids::contains(field::structured_seq)
102 && (selected_field_ids::contains(field::seq) || (selected_field_ids::contains(field::structure))));
103 }(),
104 "You may not select field::structured_seq and either of field::seq and field::structure "
105 "at the same time.");
//!\brief The value type (`void`).
113 using value_type = void;
//!\brief The reference type (`void`).
115 using reference = void;
//!\brief The const reference type (`void`).
117 using const_reference = void;
//!\brief The size type (`void`).
119 using size_type = void;
//!\brief The iterator type returned by begin(): an output file iterator over this class.
123 using iterator = detail::out_file_iterator<structure_file_output>;
//!\brief The const iterator type (`void`).
125 using const_iterator = void;
//!\brief The sentinel type returned by end().
127 using sentinel = std::default_sentinel_t;
162 selected_field_ids const & SEQAN3_DOXYGEN_ONLY(fields_tag) = selected_field_ids{}) :
163 primary_stream{new std::ofstream{}, stream_deleter_default}
164 {
165 primary_stream->rdbuf()->pubsetbuf(, stream_buffer.size());
166 static_cast<std::basic_ofstream<char> *>(primary_stream.get())
167 ->open(filename, std::ios_base::out | std::ios::binary);
169 if (!primary_stream->good())
170 throw file_open_error{"Could not open file " + filename.string() + " for writing."};
172 // possibly add intermediate compression stream
173 secondary_stream = detail::make_secondary_ostream(*primary_stream, filename);
175 // initialise format handler or throw if format is not found
176 detail::set_format(format, filename);
177 }
195 template <output_stream stream_t, structure_file_output_format file_format>
196 requires std::same_as<typename std::remove_reference_t<stream_t>::char_type, char>
197 structure_file_output(stream_t & stream,
198 file_format const & SEQAN3_DOXYGEN_ONLY(format_tag),
199 selected_field_ids const & SEQAN3_DOXYGEN_ONLY(fields_tag) = selected_field_ids{}) :
200 primary_stream{&stream, stream_deleter_noop},
201 secondary_stream{&stream, stream_deleter_noop},
202 format{detail::structure_file_output_format_exposer<file_format>{}}
203 {
204 static_assert(list_traits::contains<file_format, valid_formats>,
205 "You selected a format that is not in the valid_formats of this file.");
206 }
209 template <output_stream stream_t, structure_file_output_format file_format>
210 requires std::same_as<typename std::remove_reference_t<stream_t>::char_type, char>
211 structure_file_output(stream_t && stream,
212 file_format const & SEQAN3_DOXYGEN_ONLY(format_tag),
213 selected_field_ids const & SEQAN3_DOXYGEN_ONLY(fields_tag) = selected_field_ids{}) :
214 primary_stream{new stream_t{std::move(stream)}, stream_deleter_default},
215 secondary_stream{&*primary_stream, stream_deleter_noop},
216 format{detail::structure_file_output_format_exposer<file_format>{}}
217 {
218 static_assert(list_traits::contains<file_format, valid_formats>,
219 "You selected a format that is not in the valid_formats of this file.");
220 }
244 iterator begin() noexcept
245 {
246 return {*this};
247 }
263 sentinel end() noexcept
264 {
265 return {};
266 }
/*!\brief Write a record-like object to the file.
 * \tparam record_t Type of the record; must satisfy detail::record_like.
 * \param[in] r The record to write.
 *
 * Each field is looked up in `r` by its field id via detail::get_or_ignore and handed to write_record().
 * NOTE(review): get_or_ignore presumably yields an "ignore" placeholder for fields the record does not
 * contain - confirm against its definition.
 */
286 template <typename record_t>
287 void push_back(record_t && r)
288 requires detail::record_like<record_t>
289 {
// The argument order below must match the positional parameters of write_record():
// seq, id, bpp, structure, structured_seq, energy, react, react_err, comment, offset.
290 write_record(detail::get_or_ignore<field::seq>(r),
291 detail::get_or_ignore<field::id>(r),
292 detail::get_or_ignore<field::bpp>(r),
293 detail::get_or_ignore<field::structure>(r),
294 detail::get_or_ignore<field::structured_seq>(r),
295 detail::get_or_ignore<field::energy>(r),
296 detail::get_or_ignore<field::react>(r),
297 detail::get_or_ignore<field::react_err>(r),
298 detail::get_or_ignore<field::comment>(r),
299 detail::get_or_ignore<field::offset>(r));
300 }
/*!\brief Write a tuple-like object (that is not record-like) to the file.
 * \tparam tuple_t Type of the tuple; must satisfy tuple_like and must not satisfy detail::record_like.
 * \param[in] t The tuple to write.
 *
 * The position of each field inside `t` is taken from selected_field_ids::index_of(), i.e. the tuple
 * elements are interpreted in the order of the selected fields.
 */
323 template <typename tuple_t>
324 void push_back(tuple_t && t)
325 requires tuple_like<tuple_t> && (!detail::record_like<tuple_t>)
326 {
327 // index_of might return npos, but this will be handled well by get_or_ignore (and just return ignore)
// The argument order below must match the positional parameters of write_record():
// seq, id, bpp, structure, structured_seq, energy, react, react_err, comment, offset.
328 write_record(detail::get_or_ignore<selected_field_ids::index_of(field::seq)>(t),
329 detail::get_or_ignore<selected_field_ids::index_of(field::id)>(t),
330 detail::get_or_ignore<selected_field_ids::index_of(field::bpp)>(t),
331 detail::get_or_ignore<selected_field_ids::index_of(field::structure)>(t),
332 detail::get_or_ignore<selected_field_ids::index_of(field::structured_seq)>(t),
333 detail::get_or_ignore<selected_field_ids::index_of(field::energy)>(t),
334 detail::get_or_ignore<selected_field_ids::index_of(field::react)>(t),
335 detail::get_or_ignore<selected_field_ids::index_of(field::react_err)>(t),
336 detail::get_or_ignore<selected_field_ids::index_of(field::comment)>(t),
337 detail::get_or_ignore<selected_field_ids::index_of(field::offset)>(t));
338 }
363 template <typename arg_t, typename... arg_types>
364 void emplace_back(arg_t && arg, arg_types &&... args)
365 {
366 push_back(std::tie(arg, args...));
367 }
// Writes every element of `range` to the file and returns a reference to this object.
// NOTE(review): the declarator line between the template header and the body is not visible here;
// `range` is presumably the (input range) parameter - confirm.
390 template <std::ranges::input_range rng_t>
393 {
// Each element is forwarded with its own value category to push_back().
394 for (auto && record : range)
395 push_back(std::forward<decltype(record)>(record));
396 return *this;
397 }
// Assigns `range` to `f` and then returns `f`.
// NOTE(review): the declarator line is not visible here; `range` and `f` are presumably its parameters,
// with `f` being a file object whose range assignment writes all elements - confirm.
426 template <std::ranges::input_range rng_t>
429 {
430 f = range;
431 return f;
432 }
// Assigns `range` to `f` and then returns `f` via std::move.
// NOTE(review): the declarator line is not visible here; `range` and `f` are presumably its parameters,
// with `f` probably bound as an rvalue in this overload - confirm.
435 template <std::ranges::input_range rng_t>
438 {
439 f = range;
440 return std::move(f);
441 }
451 {
// Dereferences secondary_stream, i.e. yields the stream that write_record() writes into.
// NOTE(review): the declarator line of this function is not visible here.
452 return *secondary_stream;
453 }
//!\brief Buffer of 1'000'000 chars owned by the file object; the filename constructor passes it to pubsetbuf().
// Declared before the stream members, so it is destroyed after them (reverse declaration order).
459 std::vector<char> stream_buffer{std::vector<char>(1'000'000)};
468 static void stream_deleter_noop(std::basic_ostream<stream_char_type> *)
469 {}
471 static void stream_deleter_default(std::basic_ostream<stream_char_type> * ptr)
472 {
473 delete ptr;
474 }
//!\brief The primary stream: the user-provided stream or the file stream opened by the filename constructor.
// Starts out as a null pointer with the no-op deleter; every constructor shown replaces it.
477 stream_ptr_t primary_stream{nullptr, stream_deleter_noop};
//!\brief The stream that records are actually written to (write_record() dereferences it).
// It is set to the primary stream itself (non-owning) or to the result of detail::make_secondary_ostream().
// Declared after primary_stream, hence destroyed before it.
479 stream_ptr_t secondary_stream{nullptr, stream_deleter_noop};
//!\brief Type of the format handler storage, generated by detail::variant_from_tags from valid_formats.
// NOTE(review): presumably a std::variant holding one structure_file_output_format_exposer per valid
// format - write_record() checks valueless_by_exception() on it; confirm against variant_from_tags.
482 using format_type =
483 typename detail::variant_from_tags<valid_formats, detail::structure_file_output_format_exposer>::type;
//!\brief The format handler in use; set in the constructors.
485 format_type format;
489 template <typename seq_type,
490 typename id_type,
491 typename bpp_type,
492 typename structure_type,
493 typename structured_seq_type,
494 typename energy_type,
495 typename react_type,
496 typename comment_type,
497 typename offset_type>
498 void write_record(seq_type && seq,
499 id_type && id,
500 bpp_type && bpp,
501 structure_type && structure,
502 structured_seq_type && structured_seq,
503 energy_type && energy,
504 react_type && react,
505 react_type && react_error,
506 comment_type && comment,
507 offset_type && offset)
508 {
509 static_assert(detail::decays_to_ignore_v<structured_seq_type>
510 || (detail::decays_to_ignore_v<seq_type> && detail::decays_to_ignore_v<structure_type>),
511 "You may not select field::structured_seq and either of field::seq and field::structure "
512 "at the same time.");
514 assert(!format.valueless_by_exception());
516 [&](auto & f)
517 {
518 if constexpr (!detail::decays_to_ignore_v<structured_seq_type>)
519 {
520 f.write_structure_record(*secondary_stream,
521 options,
522 structured_seq | views::elements<0>,
523 id,
524 bpp,
525 structured_seq | views::elements<1>,
526 energy,
527 react,
528 react_error,
529 comment,
530 offset);
531 }
532 else
533 {
534 f.write_structure_record(*secondary_stream,
535 options,
536 seq,
537 id,
538 bpp,
539 structure,
540 energy,
541 react,
542 react_error,
543 comment,
544 offset);
545 }
546 },
547 format);
548 }
//!\brief Befriend the output iterator type so that it can access the non-public members of this class.
551 friend iterator;
560template <output_stream stream_t,
561 structure_file_output_format file_format,
562 detail::fields_specialisation selected_field_ids>
563structure_file_output(stream_t &&, file_format const &, selected_field_ids const &)
567template <output_stream stream_t,
569 detail::fields_specialisation selected_field_ids>
570structure_file_output(stream_t &, file_format const &, selected_field_ids const &)
574} // namespace seqan3
