GEDLIB  1.0
test_lp_based_methods.cpp
Go to the documentation of this file.
1 /***************************************************************************
2  * *
3  * Copyright (C) 2018 by David B. Blumenthal *
4  * *
5  * This file is part of GEDLIB. *
6  * *
7  * GEDLIB is free software: you can redistribute it and/or modify it *
8  * under the terms of the GNU Lesser General Public License as published *
9  * by the Free Software Foundation, either version 3 of the License, or *
10  * (at your option) any later version. *
11  * *
12  * GEDLIB is distributed in the hope that it will be useful, *
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of *
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
15  * GNU Lesser General Public License for more details. *
16  * *
17  * You should have received a copy of the GNU Lesser General Public *
18  * License along with GEDLIB. If not, see <http://www.gnu.org/licenses/>. *
19  * *
20  ***************************************************************************/
21 
31 #include "util.hpp"
32 
33 class Method {
34 private:
35  // method and options
36  ged::Options::GEDMethod ged_method_;
37 
38 
39  std::string options_() const {
40  return "--threads 6 --relax TRUE";
41  }
42 
43 public:
44  Method(ged::Options::GEDMethod ged_method) :
45  ged_method_{ged_method} {}
46 
47  std::string name() const {
48  std::stringstream name;
49  if (ged_method_ == ged::Options::GEDMethod::F1) {
50  name << "FONE";
51  }
52  else if (ged_method_ == ged::Options::GEDMethod::F2) {
53  name << "FTWO";
54  }
55  else if (ged_method_ == ged::Options::GEDMethod::COMPACT_MIP) {
56  name << "COMPACTMIP";
57  }
58  else if (ged_method_ == ged::Options::GEDMethod::BLP_NO_EDGE_LABELS) {
59  name << "JUSTICEIP";
60  }
61  return name.str();
62  }
63 
64  void run_on_dataset(const std::string & dataset, ged::GEDEnv<ged::GXLNodeID, ged::GXLLabel, ged::GXLLabel> & env, double & avg_lb, double & avg_ub, double & avg_runtime,
65  double & classification_coefficient_lb, double & classification_coefficient_ub) const {
66  env.set_method(ged_method_, options_());
67  env.init_method();
68  std::size_t num_runs{env.graph_ids().second * env.graph_ids().second};
69  ged::ProgressBar progress_bar(num_runs);
70  std::cout << "\r\t" << name() << ": " << progress_bar << std::flush;
71  std::size_t num_intra_class_runs{0};
72  std::size_t num_inter_class_runs{0};
73  double largest_lb{0.0};
74  double avg_intra_class_lb{0.0};
75  double avg_inter_class_lb{0.0};
76  double largest_ub{0.0};
77  double avg_intra_class_ub{0.0};
78  double avg_inter_class_ub{0.0};
79  avg_runtime = 0;
80  avg_ub = 0;
81  avg_lb = 0;
82  for (ged::GEDGraph::GraphID g_id = env.graph_ids().first; g_id != env.graph_ids().second; g_id++) {
83  for (ged::GEDGraph::GraphID h_id = env.graph_ids().first; h_id != env.graph_ids().second; h_id++) {
84  env.run_method(g_id, h_id);
85  avg_lb += env.get_lower_bound(g_id, h_id);
86  avg_ub += env.get_upper_bound(g_id, h_id);
87  avg_runtime += env.get_runtime(g_id, h_id);
88  if (env.get_lower_bound(g_id, h_id) > largest_lb) {
89  largest_lb = env.get_lower_bound(g_id, h_id);
90  }
91  if (env.get_upper_bound(g_id, h_id) > largest_ub) {
92  largest_ub = env.get_upper_bound(g_id, h_id);
93  }
94  if (env.get_graph_class(g_id) == env.get_graph_class(h_id)) {
95  avg_intra_class_lb += env.get_lower_bound(g_id, h_id);
96  avg_intra_class_ub += env.get_upper_bound(g_id, h_id);
97  num_intra_class_runs++;
98  }
99  else {
100  avg_inter_class_lb += env.get_lower_bound(g_id, h_id);
101  avg_inter_class_ub += env.get_upper_bound(g_id, h_id);
102  num_inter_class_runs++;
103  }
104  progress_bar.increment();
105  std::cout << "\r\t" << name() << ": " << progress_bar << std::flush;
106  }
107  }
108  avg_lb /= static_cast<double>(num_runs);
109  avg_ub /= static_cast<double>(num_runs);
110  avg_runtime /= static_cast<double>(num_runs);
111  avg_intra_class_lb /= static_cast<double>(num_intra_class_runs);
112  avg_intra_class_ub /= static_cast<double>(num_intra_class_runs);
113  avg_inter_class_lb /= static_cast<double>(num_inter_class_runs);
114  avg_inter_class_ub /= static_cast<double>(num_inter_class_runs);
115  if (largest_lb > 0) {
116  classification_coefficient_lb = (avg_inter_class_lb - avg_intra_class_lb) / largest_lb;
117  }
118  else {
119  classification_coefficient_lb = 0;
120  }
121  if (largest_ub > 0) {
122  classification_coefficient_ub = (avg_inter_class_ub - avg_intra_class_ub) / largest_ub;
123  }
124  else {
125  classification_coefficient_ub = 0;
126  }
127  std::cout << "\n";
128  }
129 };
130 
131 
132 void test_on_dataset(const std::string & dataset) {
133 
134  // Initialize environment.
135  std::cout << "\n=== " << dataset << " ===\n";
136  std::cout << "\tInitializing the environment ...\n";
138  util::setup_environment(dataset, false, env);
139 
140  // Collect all tested methods.
141  std::vector<ged::Options::GEDMethod> ged_methods{ged::Options::GEDMethod::F1, ged::Options::GEDMethod::F2, ged::Options::GEDMethod::COMPACT_MIP, ged::Options::GEDMethod::BLP_NO_EDGE_LABELS};
142  std::vector<Method> methods;
143  for (auto ged_method : ged_methods) {
144  methods.emplace_back(ged_method);
145  }
146 
147  // Run the tests.
148  std::string result_filename("../results/");
149  result_filename += dataset + "__lp_based_methods.csv";
150  std::ofstream result_file(result_filename.c_str());
151  result_file << "method;avg_lb;avg_ub;avg_runtime;classification_coefficient_lb;classification_coefficient_ub\n";
152  result_file.close();
153  double avg_ub{0};
154  double avg_lb{0};
155  double avg_runtime{0};
156  double classification_coefficient_lb{0};
157  double classification_coefficient_ub{0};
158  for (auto & method : methods) {
159  method.run_on_dataset(dataset, env, avg_lb, avg_ub, avg_runtime, classification_coefficient_lb, classification_coefficient_ub);
160  result_file.open(result_filename.c_str(),std::ios_base::app);
161  result_file << method.name() << ";" << avg_lb << ";" << avg_ub << ";" << avg_runtime << ";" << classification_coefficient_lb << ";" << classification_coefficient_ub << "\n";
162  result_file.close();
163  }
164 }
165 
166 int main(int argc, char* argv[]) {
167  std::vector<std::string> datasets;
168  for (int i{1}; i < argc; i++) {
169  datasets.push_back(std::string(argv[i]));
170  util::check_dataset(datasets.back());
171  }
172  if (datasets.empty()) {
173  util::setup_datasets(datasets);
174  }
175  for (auto dataset : datasets) {
176  try {
177  test_on_dataset(dataset);
178  }
179  catch (const std::exception & error) {
180  std::cerr << error.what() << ". " << "Error on " << dataset << ".\n";
181  }
182  }
183  return 0;
184 }
185 
186 
187 
Provides utility functions for tests of VLDB J. submission.
std::pair< GEDGraph::GraphID, GEDGraph::GraphID > graph_ids() const
Provides access to the IDs of the graphs contained in the environment.
Definition: ged_env.ipp:507
std::vector< GEDGraph >::size_type GraphID
Type of internally used graph IDs.
Definition: ged_graph.hpp:112
void init_method()
Initializes the method specified by call to set_method().
Definition: ged_env.ipp:521
GEDMethod
Selects the method.
const std::string & get_graph_class(GEDGraph::GraphID graph_id) const
Returns the graph class.
Definition: ged_env.ipp:578
double get_runtime(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns runtime.
Definition: ged_env.ipp:567
A progress bar class.
double get_upper_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns upper bound for edit distance between the input graphs.
Definition: ged_env.ipp:545
void run_method(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id)
Runs the GED method specified by call to set_method() between the graphs with IDs g_id and h_id...
Definition: ged_env.ipp:471
void set_method(Options::GEDMethod method, const std::string &options=std::string(""))
Sets the GEDMethod to be used by run_method().
Definition: ged_env.ipp:384
double get_lower_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns lower bound for edit distance between the input graphs.
Definition: ged_env.ipp:534
Provides the API of GEDLIB.
Definition: ged_data.hpp:48