37 std::size_t num_initial_solutions_;
38 double ratio_initial_solutions_;
39 double randpost_penalty_;
40 std::size_t num_randpost_loops_;
41 std::size_t max_swap_size_;
42 std::size_t num_orderings_;
45 std::string options_()
const {
46 std::string options(
"");
47 options +=
"--threads 6 --initial-solutions " + std::to_string(num_initial_solutions_) +
" --ratio-runs-from-initial-solutions " + std::to_string(ratio_initial_solutions_) +
" --num-randpost-loops " + std::to_string(num_randpost_loops_) +
" --randpost-penalty " + std::to_string(randpost_penalty_);
49 options +=
" --max-swap-size " + std::to_string(max_swap_size_);
52 options +=
" --num-orderings " + std::to_string(num_orderings_);
58 Method(
ged::Options::GEDMethod ged_method, std::size_t num_initial_solutions,
double ratio_initial_solutions, std::size_t num_randpost_loops,
double randpost_penalty = 0.0, std::size_t max_swap_size = 2, std::size_t num_orderings = 1) :
59 ged_method_{ged_method},
60 num_initial_solutions_{num_initial_solutions},
61 ratio_initial_solutions_{ratio_initial_solutions},
62 randpost_penalty_{randpost_penalty},
63 num_randpost_loops_{num_randpost_loops},
64 max_swap_size_{max_swap_size},
65 num_orderings_{num_orderings} {}
67 std::string name()
const {
68 std::stringstream name;
70 if (num_orderings_ == 1) {
78 if (max_swap_size_ == 2) {
88 name <<
",$(" << num_initial_solutions_ <<
"," << ratio_initial_solutions_ <<
"," << num_randpost_loops_ <<
"," << randpost_penalty_ <<
")$";
93 double & classification_coefficient_lb,
double & classification_coefficient_ub)
const {
98 std::cout <<
"\r\t" << name() <<
": " << progress_bar << std::flush;
99 std::size_t num_intra_class_runs{0};
100 std::size_t num_inter_class_runs{0};
101 double largest_lb{0.0};
102 double avg_intra_class_lb{0.0};
103 double avg_inter_class_lb{0.0};
104 double largest_ub{0.0};
105 double avg_intra_class_ub{0.0};
106 double avg_inter_class_ub{0.0};
124 num_intra_class_runs++;
129 num_inter_class_runs++;
131 progress_bar.increment();
132 std::cout <<
"\r\t" << name() <<
": " << progress_bar << std::flush;
135 avg_lb /=
static_cast<double>(num_runs);
136 avg_ub /=
static_cast<double>(num_runs);
137 avg_runtime /=
static_cast<double>(num_runs);
138 avg_intra_class_lb /=
static_cast<double>(num_intra_class_runs);
139 avg_intra_class_ub /=
static_cast<double>(num_intra_class_runs);
140 avg_inter_class_lb /=
static_cast<double>(num_inter_class_runs);
141 avg_inter_class_ub /=
static_cast<double>(num_inter_class_runs);
142 if (largest_lb > 0) {
143 classification_coefficient_lb = (avg_inter_class_lb - avg_intra_class_lb) / largest_lb;
146 classification_coefficient_lb = 0;
148 if (largest_ub > 0) {
149 classification_coefficient_ub = (avg_inter_class_ub - avg_intra_class_ub) / largest_ub;
152 classification_coefficient_ub = 0;
158 struct RandpostSetup {
159 std::size_t num_initial_solutions;
160 double ratio_initial_solutions;
161 std::size_t num_randpost_loops;
162 RandpostSetup (std::size_t num_initial_solutions,
double ratio_initial_solutions, std::size_t num_randpost_loops) :
163 num_initial_solutions{num_initial_solutions},
164 ratio_initial_solutions{ratio_initial_solutions},
165 num_randpost_loops{num_randpost_loops} {}
169 void test_on_dataset(
const std::string & dataset,
bool only_refine,
bool only_ipfp,
bool only_bp_beam) {
172 std::cout <<
"\n=== " << dataset <<
" ===\n";
173 std::cout <<
"\tInitializing the environment ...\n";
175 util::setup_environment(dataset,
false, env);
178 std::vector<ged::Options::GEDMethod> ged_methods;
182 else if (only_ipfp) {
185 else if (only_bp_beam) {
191 std::vector<std::size_t> nums_orderings{1, 20};
192 std::vector<std::size_t> max_swap_sizes{2, 3};
193 std::vector<RandpostSetup> randpost_setups;
194 randpost_setups.emplace_back(1, 1, 0);
195 randpost_setups.emplace_back(10, 1, 0);
196 randpost_setups.emplace_back(20, 1, 0);
197 randpost_setups.emplace_back(30, 1, 0);
198 randpost_setups.emplace_back(40, 1, 0);
199 randpost_setups.emplace_back(40, 0.5, 1);
200 randpost_setups.emplace_back(40, 0.25, 3);
201 randpost_setups.emplace_back(40, 0.125, 7);
202 std::vector<double> randpost_penalties{0.0, 1.0};
204 std::vector<Method> methods;
205 for (
auto ged_method : ged_methods) {
206 for (
auto randpost_setup : randpost_setups) {
207 if (randpost_setup.num_randpost_loops > 0) {
208 for (
auto randpost_penalty : randpost_penalties) {
210 for (
auto max_swap_size : max_swap_sizes) {
211 methods.emplace_back(ged_method, randpost_setup.num_initial_solutions, randpost_setup.ratio_initial_solutions, randpost_setup.num_randpost_loops, randpost_penalty, max_swap_size);
215 for (
auto num_orderings : nums_orderings) {
216 methods.emplace_back(ged_method, randpost_setup.num_initial_solutions, randpost_setup.ratio_initial_solutions, randpost_setup.num_randpost_loops, randpost_penalty, 2, num_orderings);
220 methods.emplace_back(ged_method, randpost_setup.num_initial_solutions, randpost_setup.ratio_initial_solutions, randpost_setup.num_randpost_loops, randpost_penalty);
226 for (
auto max_swap_size : max_swap_sizes) {
227 methods.emplace_back(ged_method, randpost_setup.num_initial_solutions, randpost_setup.ratio_initial_solutions, randpost_setup.num_randpost_loops, 0.0, max_swap_size);
231 for (
auto num_orderings : nums_orderings) {
232 methods.emplace_back(ged_method, randpost_setup.num_initial_solutions, randpost_setup.ratio_initial_solutions, randpost_setup.num_randpost_loops, 0.0, 2, num_orderings);
236 methods.emplace_back(ged_method, randpost_setup.num_initial_solutions, randpost_setup.ratio_initial_solutions, randpost_setup.num_randpost_loops);
243 std::string result_filename(
"../results/");
245 result_filename += dataset +
"__ls_based_methods_REFINE.csv";
247 else if (only_ipfp) {
248 result_filename += dataset +
"__ls_based_methods_IPFP.csv";
250 else if (only_bp_beam) {
251 result_filename += dataset +
"__ls_based_methods_BP_BEAM.csv";
254 result_filename += dataset +
"__ls_based_methods.csv";
256 std::ofstream result_file(result_filename.c_str());
257 result_file <<
"method;avg_lb;avg_ub;avg_runtime;classification_coefficient_lb;classification_coefficient_ub\n";
261 double avg_runtime{0};
262 double classification_coefficient_lb{0};
263 double classification_coefficient_ub{0};
264 for (
auto & method : methods) {
265 method.run_on_dataset(dataset, env, avg_lb, avg_ub, avg_runtime, classification_coefficient_lb, classification_coefficient_ub);
266 result_file.open(result_filename.c_str(),std::ios_base::app);
267 result_file << method.name() <<
";" << avg_lb <<
";" << avg_ub <<
";" << avg_runtime <<
";" << classification_coefficient_lb <<
";" << classification_coefficient_ub <<
"\n";
272 int main(
int argc,
char* argv[]) {
274 bool only_refine{
false};
275 bool only_ipfp{
false};
276 bool only_bp_beam{
false};
278 if (std::string(argv[i]) ==
"--refine") {
282 else if (std::string(argv[i]) ==
"--ipfp") {
286 else if (std::string(argv[i]) ==
"--bp-beam") {
291 std::vector<std::string> datasets;
292 for (; i < argc; i++) {
293 datasets.push_back(std::string(argv[i]));
294 util::check_dataset(datasets.back());
296 if (datasets.empty()) {
297 util::setup_datasets(datasets);
299 for (
auto dataset : datasets) {
301 test_on_dataset(dataset, only_refine, only_ipfp, only_bp_beam);
303 catch (
const std::exception & error) {
304 std::cerr << error.what() <<
". " <<
"Error on " << dataset <<
".\n";
Provides utility functions for tests of VLDB J. submission.
std::pair< GEDGraph::GraphID, GEDGraph::GraphID > graph_ids() const
Provides access to the IDs of the graphs contained in the environment.
std::vector< GEDGraph >::size_type GraphID
Type of internally used graph IDs.
void init_method()
Initializes the method specified by call to set_method().
GEDMethod
Selects the method.
const std::string & get_graph_class(GEDGraph::GraphID graph_id) const
Returns the graph class.
double get_runtime(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns runtime.
double get_upper_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns upper bound for edit distance between the input graphs.
void run_method(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id)
Runs the GED method specified by call to set_method() between the graphs with IDs g_id and h_id...
void set_method(Options::GEDMethod method, const std::string &options=std::string(""))
Sets the GEDMethod to be used by run_method().
double get_lower_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns lower bound for edit distance between the input graphs.
Provides the API of GEDLIB.