forked from cwida/gfe_driver
-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathconfiguration.hpp
250 lines (193 loc) · 12.4 KB
/
configuration.hpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
/**
* Copyright (C) 2019 Dean De Leo, email: dleo[at]cwi.nl
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*/
#pragma once
#include <cinttypes>
#include <cstddef>
#include <iostream>
#include <memory>
#include <mutex>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>
#include "common/error.hpp"
// Forward declarations. This header only names these types through pointers, references and
// std::unique_ptr in declarations, so their complete definitions are not needed here.
namespace common {
class Database;
} // namespace common
namespace gfe {
class Configuration;
namespace experiment {
struct GraphalyticsAlgorithms;
} // namespace experiment
namespace library {
class Interface;
} // namespace library
} // namespace gfe
namespace gfe {
// Singleton interface
Configuration& configuration(); // retrieve the current singleton (client, server or standalone)

// Generic configuration error
DEFINE_EXCEPTION(ConfigurationError);

// Mutex acquired by the macro LOG while it writes to the standard output
extern std::mutex _log_mutex;

// Print the given message to the standard output, followed by a new line, and flush the stream.
// - `msg' is pasted verbatim into a chain of operator<<, hence it can be a chain itself, e.g. LOG("value: " << value).
//   For the same reason, it cannot be enclosed in parentheses inside the macro.
// - The mutex is named with its fully qualified name, so that the macro also expands correctly outside the namespace gfe.
// - The guard has a deliberately unusual name, so that a variable named `lock' used by the caller inside `msg' still
//   refers to the caller's variable and not to the guard.
// - The expansion is a braced block rather than a single statement: writing `if(cond) LOG(x); else ...' without braces
//   does not compile, enclose the invocation in braces in that case.
#define LOG( msg ) { std::scoped_lock gfe_log_guard_(::gfe::_log_mutex); std::cout << msg << /* flush immediately */ std::endl; }

// Type of counter for the number of threads, it is the argument expected by Configuration::num_threads()
enum ThreadsType { THREADS_READ, THREADS_WRITE, THREADS_TOTAL };
/**
 * Global settings of the driver.
 *
 * Usage:
 *  - Populate the singleton instance, only once, through Configuration::initialise(int argc, char* argv[])
 *  - Retrieve the singleton instance through the function configuration()
 *
 * The class is not thread safe.
 */
class Configuration {
    // Instances cannot be copied
    Configuration(const Configuration&) = delete;
    Configuration& operator=(const Configuration&) = delete;

    // ---- Properties ----

    // Cool-off period in the aging experiment, in seconds
    uint64_t m_aging_cooloff_seconds { 0 };
    // Whether to measure the memory footprint
    bool m_aging_memfp { false };
    // Whether to compute the physical memory or the virtual memory
    bool m_aging_memfp_physical { false };
    // Whether to print to stdout the measurements observed for the memory footprint
    bool m_aging_memfp_report { false };
    // Forcibly stop the execution of the aging2 experiment if the process is using more memory than this threshold, in bytes
    uint64_t m_aging_memfp_threshold { 0 };
    // Whether to release the memory from the driver as the experiment proceeds
    bool m_aging_release_memory { true };
    // List of graph algorithms that cannot be executed
    std::vector<std::string> m_blacklist;
    // In the aging experiment, the amount of time that must pass before each invocation to #build(), in milliseconds
    uint64_t m_build_frequency { 0 };
    // Coefficient for the additional updates to perform
    double m_coeff_aging { 0.0 };
    // Handle to the database
    common::Database* m_database { nullptr };
    // The path where to store the results
    std::string m_database_path { "" };
    // Expansion factor for the vertices in the graph
    double m_ef_vertices { 1.0 };
    // Expansion factor for the edges in the graph
    double m_ef_edges { 1.0 };
    // Whether the graph is directed (as opposed to undirected)
    bool m_graph_directed { true };
    // The library to test
    std::string m_library_name;
    // Whether to load the graph in one go
    bool m_load { false };
    // The maximum weight that can be assigned when reading non weighted graphs
    double m_max_weight { 1.0 };
    // Whether to measure the latency of the update operations (insert/deletion)
    bool m_measure_latency { false };
    // When applicable, how many times the same experiment should be repeated
    uint64_t m_num_repetitions { 0 };
    // If different than 0, the max number of threads used by OpenMP
    int m_num_threads_omp { 0 };
    // Number of threads to use for the read operations, 0 => the default of OpenMP
    int m_num_threads_read { 0 };
    // Number of threads to use for the write (insert/update/delete) operations
    int m_num_threads_write { 1 };
    // The graph to load, the file must be accessible to the server
    std::string m_path_graph_to_load;
    // Random seed, used in various places in the experiments
    uint64_t m_seed { 5051789ull };
    // In the aging2 experiment, how often to record the progress done in the db. It must be a value in (0, 1].
    double m_step_size_recordings { 1.0 };
    // Forcibly stop the aging2 experiment after the given amount of seconds
    uint64_t m_timeout_aging2 { 0 };
    // Max time to complete a kernel from Graphalytics, in seconds (0 => indefinite)
    uint64_t m_timeout_graphalytics { 3600 };
    // Aging experiment through the log file
    std::string m_update_log;
    // Function to retrieve an instance of the library `m_library_name'
    std::unique_ptr<library::Interface> (*m_library_factory)(bool directed) { nullptr };
    // Validate the results from graphalytics against the given graph
    std::string m_validate_graph;
    // Whether to validate the edges inserted
    bool m_validate_inserts { false };
    // Whether to validate the execution results of the Graphalytics algorithms
    bool m_validate_output { false };
    // Block size for Sortledton to use
    size_t m_block_size { 1024 };
    // Mixed workload flag, see is_mixed_workload(). Its semantics are not documented in this header.
    bool m_is_mixed_workload { false };
    // Timestamped graph flag, see is_timestamped_graph(). Its semantics are not documented in this header.
    bool m_is_timestamped_graph { false };

    // ---- Private setters, all defined out of line unless a body is given ----

    void set_aging_cooloff_seconds(uint64_t value);
    void set_aging_memfp_threshold(uint64_t bytes);
    // The step in each recording in the progress for the Aging2 experiment. In (0, 1].
    void set_aging_step_size(double value);
    void set_build_frequency(uint64_t millisecs);
    // Set the coefficient for `aging', i.e. how many updates (insertions/deletions) to perform w.r.t. the size of the loaded graph
    void set_coeff_aging(double value);
    void set_ef_vertices(double value);
    void set_ef_edges(double value);
    void set_load(bool value);
    // Set how many times to repeat the Graphalytics suite of algorithms
    void set_num_repetitions(uint64_t value);
    // The number of threads created by an OpenMP master
    void set_num_threads_omp(int value);
    // Set the number of threads to use in the read operations
    void set_num_threads_read(int value);
    // Set the number of threads to use in the write operations
    void set_num_threads_write(int value);
    // Set the maximum amount of time (excl. cool-off time) to run the Aging2 experiment
    void set_timeout_aging2(uint64_t seconds);
    // Set the timeout property
    void set_timeout_graphalytics(uint64_t seconds);
    // Set the graph to load and run the experiments
    void set_graph(const std::string& graph);
    void set_block_size(size_t block_size);
    void set_is_timestamped(bool timestamped);

    // Set the path to the database
    void set_database_path(const std::string& path) {
        m_database_path = path;
    }

    // The max weight that can be assigned by graph readers when parsing a non weighted graph
    void set_max_weight(double value);

    // Set the property seed
    void set_seed(uint64_t value) {
        m_seed = value;
    }

    // Check whether the given property has been blacklisted
    void do_blacklist(bool& property_enabled, const char* property_name) const;

public:
    // Default configuration
    Configuration();

    // Destructor
    ~Configuration();

    // Initialise the configuration with the arguments provided by the user
    void initialise(int argc, char* argv[]);

    // Retrieve the name of the library to evaluate
    const std::string& get_library_name() const {
        return m_library_name;
    }

    // Path to the graphlog with the updates to perform (aging2 experiment)
    const std::string& get_update_log() const {
        return m_update_log;
    }

    // Generate an instance of the graph library to evaluate
    std::unique_ptr<library::Interface> generate_graph_library();

    // Whether the graph is directed or undirected
    bool is_graph_directed() const {
        return m_graph_directed;
    }

    // Whether to validate the execution results of the Graphalytics algorithms
    bool validate_output() const {
        return m_validate_output;
    }

    // Whether to validate the edges inserted
    bool validate_inserts() const {
        return m_validate_inserts;
    }

    // The path to the graph with the results to validate
    const std::string& get_validation_graph() const;

    // Coefficient for the surplus of updates to perform (noise) w.r.t. the final graph to load
    double coefficient_aging() const {
        return m_coeff_aging;
    }

    // The step of each recording in the progress for the Aging2 experiment
    double get_aging_step_size() const {
        return m_step_size_recordings;
    }

    // Number of recordings per operations, in the Aging experiment
    uint64_t get_num_recordings_per_ops() const;

    // Measure the latency of update operations ?
    bool measure_latency() const {
        return m_measure_latency;
    }

    // Number of repetitions of the same experiment (when applicable)
    uint64_t num_repetitions() const {
        return m_num_repetitions;
    }

    // Get the number of threads to use
    int num_threads(ThreadsType type) const;

    // Get the max number of threads that an OpenMP master can create
    int num_threads_omp() const;

    // The path for the graph to load
    const std::string& get_path_graph() const {
        return m_path_graph_to_load;
    }

    // The budget to complete a Graphalytics algorithm, in seconds (e.g. LCC should terminate by get_timeout_graphalytics() seconds)
    uint64_t get_timeout_graphalytics() const {
        return m_timeout_graphalytics;
    }

    // Maximum amount of time to run the Aging2 experiment, in seconds
    uint64_t get_timeout_aging2() const {
        return m_timeout_aging2;
    }

    // Get the expansion factor in the aging experiment for the edges in the graph
    double get_ef_edges() const {
        return m_ef_edges;
    }

    // Get the expansion factor in the aging experiment for the vertices in the graph
    double get_ef_vertices() const {
        return m_ef_vertices;
    }

    // Get the frequency to build a new snapshot, in milliseconds
    uint64_t get_build_frequency() const {
        return m_build_frequency;
    }

    // Get the cool-off period in the aging experiment. After the experiment terminates, the driver waits for the given
    // amount of seconds idle, checking the amount of memory used. The goal is to detect the impact of the garbage
    // collector of the evaluated library in reducing the memory footprint when no updates are being executed.
    uint64_t get_aging_cooloff_seconds() const {
        return m_aging_cooloff_seconds;
    }

    // Whether to measure the memory footprint in the aging2 experiment
    bool get_aging_memfp() const {
        return m_aging_memfp;
    }

    // Alias of get_aging_memfp()
    bool measure_memfp() const {
        return get_aging_memfp();
    }

    // Forcibly stop the execution of the aging2 experiment if the process is using more memory than this threshold, in bytes
    uint64_t get_aging_memfp_threshold() const {
        return m_aging_memfp_threshold;
    }

    // Whether to print to stdout the measurements observed for the memory footprint
    bool get_aging_memfp_report() const {
        return m_aging_memfp_report;
    }

    // Whether to consider the physical memory or the virtual memory in the memory footprint
    bool get_aging_memfp_physical() const {
        return m_aging_memfp_physical;
    }

    // Whether to release the memory from the driver as the experiment proceeds
    bool get_aging_release_memory() const {
        return m_aging_release_memory;
    }

    // Check whether the configuration/results need to be stored into a database
    bool has_database() const;

    // Whether to load the graph in one go
    bool is_load() const;

    // Retrieve the handle to the database connection, where the final results of the experiments are stored
    ::common::Database* db();

    // Save the configuration properties into the database
    void save_parameters();

    // Random seed, used in various places in the experiments
    uint64_t seed() const {
        return m_seed;
    }

    // Get the max weight that can be assigned by the graph readers when parsing a non weighted graph
    double max_weight() const {
        return m_max_weight;
    }

    // Retrieve the path to the database
    const std::string& get_database_path() const {
        return m_database_path;
    }

    // Remove the algorithms blacklisted by the user in the GraphalyticsAlgorithms list
    void blacklist(gfe::experiment::GraphalyticsAlgorithms& algorithms) const;

    // Block size, presumably the value of m_block_size (the definition is not in this header).
    // NOTE(review): unlike the other accessors, this method is not const qualified.
    size_t block_size();

    // Mixed workload flag, presumably the value of m_is_mixed_workload (the definition is not in this header)
    bool is_mixed_workload() const;

    // Timestamped graph flag, presumably the value of m_is_timestamped_graph (the definition is not in this header)
    bool is_timestamped_graph() const;
};
} // namespace