Chopper
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
configuration.hpp
Go to the documentation of this file.
1// ---------------------------------------------------------------------------------------------------
2// Copyright (c) 2006-2023, Knut Reinert & Freie Universität Berlin
3// Copyright (c) 2016-2023, Knut Reinert & MPI für molekulare Genetik
4// This file may be used, modified and/or redistributed under the terms of the 3-clause BSD-License
5// shipped with this file and also available at: https://github.com/seqan/chopper/blob/main/LICENSE.md
6// ---------------------------------------------------------------------------------------------------
7
8#pragma once
9
10#include <cinttypes>
11#include <filesystem>
12#include <iosfwd>
13
14#include <cereal/cereal.hpp>
15
16#include <hibf/cereal/path.hpp> // IWYU pragma: keep
17#include <hibf/config.hpp>
18#include <hibf/misc/timer.hpp>
19
20namespace chopper
21{
22
24{
29 std::filesystem::path data_file;
30
32 bool debug{false};
33
35 std::filesystem::path output_filename{"layout.txt"};
36
38 std::filesystem::path output_timings{};
39
41 uint8_t k{19};
42
44 uint8_t window_size{k};
45
47 bool precomputed_files{false};
49
54 std::filesystem::path sketch_directory{};
55
59
65
67 bool force_all_binnings{false};
68
72
74 seqan::hibf::config hibf_config;
75
76 mutable seqan::hibf::concurrent_timer compute_sketches_timer{};
77 mutable seqan::hibf::concurrent_timer union_estimation_timer{};
78 mutable seqan::hibf::concurrent_timer rearrangement_timer{};
79 mutable seqan::hibf::concurrent_timer dp_algorithm_timer{};
80
81 void read_from(std::istream & stream);
82
83 void write_to(std::ostream & stream) const;
84
85private:
86 friend class cereal::access;
87
88 template <typename archive_t>
89 void serialize(archive_t & archive)
90 {
91 uint32_t version{2};
92 archive(CEREAL_NVP(version));
93
94 archive(CEREAL_NVP(data_file));
95 archive(CEREAL_NVP(debug));
96 archive(CEREAL_NVP(sketch_directory));
97 archive(CEREAL_NVP(k));
98 archive(CEREAL_NVP(window_size));
99 archive(CEREAL_NVP(disable_sketch_output));
100 archive(CEREAL_NVP(precomputed_files));
101
102 archive(CEREAL_NVP(output_filename));
103 archive(CEREAL_NVP(determine_best_tmax));
104 archive(CEREAL_NVP(force_all_binnings));
105 }
106};
107
108} // namespace chopper
Definition: adjust_seed.hpp:18
Definition: configuration.hpp:24
std::filesystem::path sketch_directory
The name for the output directory when writing sketches to disk.
Definition: configuration.hpp:54
seqan::hibf::config hibf_config
The HIBF config which will be used to compute the layout within the HIBF lib.
Definition: configuration.hpp:74
uint8_t window_size
The window size to compute minimizers before computing a HyperLogLog sketch from them.
Definition: configuration.hpp:44
std::filesystem::path output_filename
The name of the layout file to write.
Definition: configuration.hpp:35
void write_to(std::ostream &stream) const
Definition: configuration.cpp:46
seqan::hibf::concurrent_timer rearrangement_timer
Definition: configuration.hpp:78
seqan::hibf::concurrent_timer union_estimation_timer
Definition: configuration.hpp:77
seqan::hibf::concurrent_timer compute_sketches_timer
Definition: configuration.hpp:76
bool precomputed_files
Whether the input files are precomputed files (.minimiser) instead of sequence files.
Definition: configuration.hpp:47
uint8_t k
The kmer size to hash the input sequences before computing a HyperLogLog sketch from them.
Definition: configuration.hpp:41
bool determine_best_tmax
Whether the program should determine the best number of IBF bins by doing multiple binning runs.
Definition: configuration.hpp:64
seqan::hibf::concurrent_timer dp_algorithm_timer
Definition: configuration.hpp:79
std::filesystem::path output_timings
If specified, layout timings are written to the specified file.
Definition: configuration.hpp:38
bool force_all_binnings
Whether the programm should compute all binnings up to the given t_max.
Definition: configuration.hpp:67
friend class cereal::access
Definition: configuration.hpp:86
void read_from(std::istream &stream)
Definition: configuration.cpp:21
std::filesystem::path data_file
The input file to chopper. Should contain one file path per line.
Definition: configuration.hpp:29
bool output_verbose_statistics
Whether to print verbose output when computing the statistics when computing the layout.
Definition: configuration.hpp:70
void serialize(archive_t &archive)
Definition: configuration.hpp:89
bool debug
Internal parameter that triggers some verbose debug output.
Definition: configuration.hpp:32
bool disable_sketch_output
Do not write the sketches into a dedicated directory.
Definition: configuration.hpp:57