GEDLIB  1.0
test_misc_methods.cpp
Go to the documentation of this file.
1 /***************************************************************************
2  * *
3  * Copyright (C) 2018 by David B. Blumenthal *
4  * *
5  * This file is part of GEDLIB. *
6  * *
7  * GEDLIB is free software: you can redistribute it and/or modify it *
8  * under the terms of the GNU Lesser General Public License as published *
9  * by the Free Software Foundation, either version 3 of the License, or *
10  * (at your option) any later version. *
11  * *
12  * GEDLIB is distributed in the hope that it will be useful, *
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of *
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
15  * GNU Lesser General Public License for more details. *
16  * *
17  * You should have received a copy of the GNU Lesser General Public *
18  * License along with GEDLIB. If not, see <http://www.gnu.org/licenses/>. *
19  * *
20  ***************************************************************************/
21 
31 #include "util.hpp"
32 
33 class Method {
34 private:
35  // method and options
36  ged::Options::GEDMethod ged_method_;
37 
38 
39  std::string options_() const {
40  std::string options("");
42  options += "--threads 6";
43  }
44  if (ged_method_ == ged::Options::GEDMethod::HYBRID) {
45  options += " --time-limit 1";
46  }
47  return options;
48  }
49 
50 public:
51  Method(ged::Options::GEDMethod ged_method) :
52  ged_method_{ged_method} {}
53 
54  std::string name() const {
55  std::stringstream name;
56  if (ged_method_ == ged::Options::GEDMethod::BRANCH_COMPACT) {
57  name << "BRANCHCOMPACT";
58  }
59  else if (ged_method_ == ged::Options::GEDMethod::PARTITION) {
60  name << "PARTITION";
61  }
62  else if (ged_method_ == ged::Options::GEDMethod::SIMULATED_ANNEALING) {
63  name << "SA";
64  }
65  else if (ged_method_ == ged::Options::GEDMethod::HYBRID) {
66  name << "HYBRID";
67  }
68  else if (ged_method_ == ged::Options::GEDMethod::BRANCH_TIGHT) {
69  name << "BRANCHTIGHT";
70  }
71  else if (ged_method_ == ged::Options::GEDMethod::HED) {
72  name << "HED";
73  }
74  return name.str();
75  }
76 
77  void run_on_dataset(const std::string & dataset, ged::GEDEnv<ged::GXLNodeID, ged::GXLLabel, ged::GXLLabel> & env, double & avg_lb, double & avg_ub, double & avg_runtime,
78  double & classification_coefficient_lb, double & classification_coefficient_ub) const {
79  env.set_method(ged_method_, options_());
80  if (dataset != "Protein" or ged_method_ != ged::Options::GEDMethod::PARTITION) {
81  env.init_method();
82  }
83  std::size_t num_runs{env.graph_ids().second * env.graph_ids().second};
84  ged::ProgressBar progress_bar(num_runs);
85  std::cout << "\r\t" << name() << ": " << progress_bar << std::flush;
86  std::size_t num_intra_class_runs{0};
87  std::size_t num_inter_class_runs{0};
88  double largest_lb{0.0};
89  double avg_intra_class_lb{0.0};
90  double avg_inter_class_lb{0.0};
91  double largest_ub{0.0};
92  double avg_intra_class_ub{0.0};
93  double avg_inter_class_ub{0.0};
94  avg_runtime = 0;
95  avg_ub = 0;
96  avg_lb = 0;
97  for (ged::GEDGraph::GraphID g_id = env.graph_ids().first; g_id != env.graph_ids().second; g_id++) {
98  for (ged::GEDGraph::GraphID h_id = env.graph_ids().first; h_id != env.graph_ids().second; h_id++) {
99  env.run_method(g_id, h_id);
100  avg_lb += env.get_lower_bound(g_id, h_id);
101  avg_ub += env.get_upper_bound(g_id, h_id);
102  avg_runtime += env.get_runtime(g_id, h_id);
103  if (env.get_lower_bound(g_id, h_id) > largest_lb) {
104  largest_lb = env.get_lower_bound(g_id, h_id);
105  }
106  if (env.get_upper_bound(g_id, h_id) > largest_ub) {
107  largest_ub = env.get_upper_bound(g_id, h_id);
108  }
109  if (env.get_graph_class(g_id) == env.get_graph_class(h_id)) {
110  avg_intra_class_lb += env.get_lower_bound(g_id, h_id);
111  avg_intra_class_ub += env.get_upper_bound(g_id, h_id);
112  num_intra_class_runs++;
113  }
114  else {
115  avg_inter_class_lb += env.get_lower_bound(g_id, h_id);
116  avg_inter_class_ub += env.get_upper_bound(g_id, h_id);
117  num_inter_class_runs++;
118  }
119  progress_bar.increment();
120  std::cout << "\r\t" << name() << ": " << progress_bar << std::flush;
121  }
122  }
123  avg_lb /= static_cast<double>(num_runs);
124  avg_ub /= static_cast<double>(num_runs);
125  avg_runtime /= static_cast<double>(num_runs);
126  avg_intra_class_lb /= static_cast<double>(num_intra_class_runs);
127  avg_intra_class_ub /= static_cast<double>(num_intra_class_runs);
128  avg_inter_class_lb /= static_cast<double>(num_inter_class_runs);
129  avg_inter_class_ub /= static_cast<double>(num_inter_class_runs);
130  if (largest_lb > 0) {
131  classification_coefficient_lb = (avg_inter_class_lb - avg_intra_class_lb) / largest_lb;
132  }
133  else {
134  classification_coefficient_lb = 0;
135  }
136  if (largest_ub > 0) {
137  classification_coefficient_ub = (avg_inter_class_ub - avg_intra_class_ub) / largest_ub;
138  }
139  else {
140  classification_coefficient_ub = 0;
141  }
142  std::cout << "\n";
143  }
144 };
145 
146 
147 void test_on_dataset(const std::string & dataset) {
148 
149  // Initialize environment.
150  std::cout << "\n=== " << dataset << " ===\n";
151  std::cout << "\tInitializing the environment ...\n";
153  util::setup_environment(dataset, false, env);
154 
155  // Collect all tested methods.
157  std::vector<Method> methods;
158  for (auto ged_method : ged_methods) {
159  methods.emplace_back(ged_method);
160  }
161 
162  // Run the tests.
163  std::string result_filename("../results/");
164  result_filename += dataset + "__misc_methods.csv";
165  std::ofstream result_file(result_filename.c_str());
166  result_file << "method;avg_lb;avg_ub;avg_runtime;classification_coefficient_lb;classification_coefficient_ub\n";
167  result_file.close();
168  double avg_ub{0};
169  double avg_lb{0};
170  double avg_runtime{0};
171  double classification_coefficient_lb{0};
172  double classification_coefficient_ub{0};
173  for (auto & method : methods) {
174  method.run_on_dataset(dataset, env, avg_lb, avg_ub, avg_runtime, classification_coefficient_lb, classification_coefficient_ub);
175  result_file.open(result_filename.c_str(),std::ios_base::app);
176  result_file << method.name() << ";" << avg_lb << ";" << avg_ub << ";" << avg_runtime << ";" << classification_coefficient_lb << ";" << classification_coefficient_ub << "\n";
177  result_file.close();
178  }
179 }
180 
181 int main(int argc, char* argv[]) {
182  std::vector<std::string> datasets;
183  for (int i{1}; i < argc; i++) {
184  datasets.push_back(std::string(argv[i]));
185  util::check_dataset(datasets.back());
186  }
187  if (datasets.empty()) {
188  util::setup_datasets(datasets);
189  }
190  for (auto dataset : datasets) {
191  try {
192  test_on_dataset(dataset);
193  }
194  catch (const std::exception & error) {
195  std::cerr << error.what() << ". " << "Error on " << dataset << ".\n";
196  }
197  }
198  return 0;
199 }
200 
201 
202 
Provides utility functions for tests of VLDB J. submission.
std::pair< GEDGraph::GraphID, GEDGraph::GraphID > graph_ids() const
Provides access to the IDs of the graphs contained in the environment.
Definition: ged_env.ipp:507
std::vector< GEDGraph >::size_type GraphID
Type of internally used graph IDs.
Definition: ged_graph.hpp:112
void init_method()
Initializes the method specified by call to set_method().
Definition: ged_env.ipp:521
GEDMethod
Selects the method.
const std::string & get_graph_class(GEDGraph::GraphID graph_id) const
Returns the graph class.
Definition: ged_env.ipp:578
Selects ged::BranchTight.
double get_runtime(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns runtime.
Definition: ged_env.ipp:567
Selects ged::Partition.
A progress bar class.
Selects ged::SimulatedAnnealing.
double get_upper_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns upper bound for edit distance between the input graphs.
Definition: ged_env.ipp:545
void run_method(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id)
Runs the GED method specified by call to set_method() between the graphs with IDs g_id and h_id...
Definition: ged_env.ipp:471
void set_method(Options::GEDMethod method, const std::string &options=std::string(""))
Sets the GEDMethod to be used by run_method().
Definition: ged_env.ipp:384
Selects ged::Hybrid.
double get_lower_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns lower bound for edit distance between the input graphs.
Definition: ged_env.ipp:534
Provides the API of GEDLIB.
Definition: ged_data.hpp:48
Selects ged::BranchCompact.