40 #define GXL_GEDLIB_SHARED 41 #include "../../../src/env/ged_env.hpp" 43 constexpr std::size_t centrality() {
return 20;}
44 constexpr std::size_t no_centrality() {
return 0;}
45 constexpr std::size_t lsape_optimal() {
return 0;}
46 constexpr std::size_t gamma() {
return 40;}
47 constexpr std::size_t lsape_greedy() {
return 80;}
48 constexpr std::size_t no_led_option() {
return 0;}
50 template <
typename ScalarT>
51 void init_result_map(std::map<std::size_t, ScalarT> & result_map, ScalarT val) {
70 void init_method_name_map(std::map<std::size_t, std::string> & method_name_map) {
89 void normalize_result_map(std::map<std::size_t, double> & result_map, std::size_t val) {
90 for (
auto & kv : result_map) {
91 kv.second /=
static_cast<double>(val);
97 std::map<std::size_t, double> & avg_time_in_sec, std::map<std::size_t, double> & avg_ub,
double & best_ub, std::map<std::size_t, double> & ub,
98 std::map<std::size_t, double> & distance_to_closest_graph, std::map<std::size_t, ged::GEDGraph::GraphID> & closest_graph) {
101 std::size_t method_index{
static_cast<std::size_t
>(method) + centrality + gamma};
104 avg_time_in_sec[method_index] += time;
105 avg_ub[method_index] += ub.at(method_index);
106 best_ub = std::min(best_ub, ub.at(method_index));
107 if (ub.at(method_index) < distance_to_closest_graph.at(method_index)) {
108 distance_to_closest_graph[method_index] = ub.at(method_index);
109 closest_graph[method_index] = h_id;
113 void run_tests_on_dataset(
const std::string & dataset) {
116 std::cout <<
"\n=== " << dataset <<
" ===\n";
117 std::cout <<
"\tInitializing the environment ...\n";
119 std::vector<ged::GEDGraph::GraphID> graph_ids(env.
load_gxl_graphs(std::string(
"../../../data/datasets/") + dataset +
"/", std::string(
"../../../data/collections/") + dataset +
".xml"));
120 if (dataset ==
"GREC") {
128 std::string output_prefix(
"../output/");
129 output_prefix += dataset +
"_";
132 std::string threads_option(
"--threads 5");
133 std::string centrality_option(
"--centrality-method PAGERANK");
134 std::string walks_depth_option(
"--load ");
135 walks_depth_option += output_prefix +
"walks.ini";
136 std::string subgraph_depth_option(
"--load ");
137 subgraph_depth_option += output_prefix +
"subgraph.ini";
138 std::string ring_option_lsape_optimal(
"--led-method LSAPE_OPTIMAL --load ");
139 ring_option_lsape_optimal += output_prefix +
"ring_LSAPE_OPTIMAL.ini";
140 std::string ring_option_lsape_greedy(
"--led-method LSAPE_GREEDY --load ");
141 ring_option_lsape_greedy += output_prefix +
"ring_LSAPE_GREEDY.ini";
142 std::string ring_option_gamma(
"--led-method GAMMA --load ");
143 ring_option_gamma += output_prefix +
"ring_GAMMA.ini";
147 std::map<std::size_t, double> avg_time_in_sec;
148 init_result_map(avg_time_in_sec, 0.0);
149 std::map<std::size_t, double> avg_ub;
150 init_result_map(avg_ub, 0.0);
151 std::map<std::size_t, double> classification_ratio;
152 init_result_map(classification_ratio, 0.0);
153 std::map<std::size_t, double> avg_dev_best_ub;
154 init_result_map(avg_dev_best_ub, 0.0);
155 std::map<std::size_t, double> distance_to_closest_graph;
156 std::map<std::size_t, ged::GEDGraph::GraphID> closest_graph;
157 std::map<std::size_t, double> ub;
161 std::ofstream outfile(output_prefix +
"results.csv");
162 outfile <<
"method,avg_time_in_sec,avg_ub,classification_ratio,avg_dev_best_ub\n";
163 std::size_t num_runs{(graph_ids.size() * graph_ids.size()) - graph_ids.size()};
165 std::cout <<
"\r\tRunning the tests: " << progress_bar << std::flush;
166 std::size_t num_best_ub_zero{0};
167 for (
auto g_id : graph_ids) {
169 init_result_map(distance_to_closest_graph, std::numeric_limits<double>::max());
170 init_result_map(closest_graph, std::numeric_limits<ged::GEDGraph::GraphID>::max());
171 for (
auto h_id : graph_ids) {
177 best_ub = std::numeric_limits<double>::max();
178 init_result_map(ub, std::numeric_limits<double>::max());
181 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::BIPARTITE, no_centrality(), no_led_option(), threads_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
182 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::BIPARTITE, centrality(), no_led_option(), threads_option +
" " + centrality_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
183 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::BRANCH, no_centrality(), no_led_option(), threads_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
184 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::BRANCH, centrality(), no_led_option(), threads_option +
" " + centrality_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
185 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::BRANCH_FAST, no_centrality(), no_led_option(), threads_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
186 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::BRANCH_FAST, centrality(), no_led_option(), threads_option +
" " + centrality_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
187 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::WALKS, no_centrality(), no_led_option(), walks_depth_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
188 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::WALKS, centrality(), no_led_option(), centrality_option +
" " + walks_depth_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
189 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::SUBGRAPH, no_centrality(), no_led_option(), threads_option +
" " + subgraph_depth_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
190 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::SUBGRAPH, centrality(), no_led_option(), threads_option +
" " + centrality_option +
" " + subgraph_depth_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
191 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::RING, no_centrality(), lsape_optimal(), threads_option +
" " + ring_option_lsape_optimal, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
192 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::RING, centrality(), lsape_optimal(), threads_option +
" " + ring_option_lsape_optimal +
" " + centrality_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
193 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::RING, no_centrality(), gamma(), threads_option +
" " + ring_option_gamma, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
194 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::RING, centrality(), gamma(), threads_option +
" " + ring_option_gamma +
" " + centrality_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
195 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::RING, no_centrality(), lsape_greedy(), threads_option +
" " + ring_option_lsape_greedy, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
196 run_single_test(env, g_id, h_id,
ged::Options::GEDMethod::RING, centrality(), lsape_greedy(), threads_option +
" " + ring_option_lsape_greedy +
" " + centrality_option, avg_time_in_sec, avg_ub, best_ub, ub, distance_to_closest_graph, closest_graph);
199 for (
auto & kv : avg_dev_best_ub) {
201 kv.second += (ub.at(kv.first) - best_ub) / best_ub;
209 progress_bar.increment();
210 std::cout <<
"\r\tRunning the tests: " << progress_bar << std::flush;
214 for (
auto & kv : classification_ratio) {
221 normalize_result_map(avg_ub, num_runs);
222 normalize_result_map(avg_time_in_sec, num_runs);
223 normalize_result_map(avg_dev_best_ub, num_runs - num_best_ub_zero);
224 normalize_result_map(classification_ratio, graph_ids.size());
227 std::map<std::size_t, std::string> method_names;
228 init_method_name_map(method_names);
229 for (
auto & kv : method_names) {
230 outfile << kv.second <<
"," << avg_time_in_sec.at(kv.first) <<
"," << avg_ub.at(kv.first) <<
"," << classification_ratio.at(kv.first) <<
"," << avg_dev_best_ub.at(kv.first) <<
"\n";
235 int main(
int argc,
char* argv[]) {
236 std::vector<std::string> datasets{
"mao",
"pah",
"alkane",
"acyclic"};
237 for (
auto dataset : datasets) {
239 run_tests_on_dataset(dataset);
241 catch (
const std::exception & error) {
242 std::cerr << error.what() <<
". " <<
"Error on " << dataset <<
"\n";
std::vector< GEDGraph >::size_type GraphID
Type of internally used graph IDs.
void init(Options::InitType init_type=Options::InitType::EAGER_WITHOUT_SHUFFLED_COPIES)
Initializes the environment.
std::vector< GEDGraph::GraphID > load_gxl_graphs(const std::string &graph_dir, const std::string &collection_file, Options::GXLNodeEdgeType node_type=Options::GXLNodeEdgeType::LABELED, Options::GXLNodeEdgeType edge_type=Options::GXLNodeEdgeType::LABELED, const std::unordered_set< std::string > &irrelevant_node_attributes=std::unordered_set< std::string >(), const std::unordered_set< std::string > &irrelevant_edge_attributes=std::unordered_set< std::string >())
Loads graphs given in the GXL file format.
void set_edit_costs(Options::EditCosts edit_costs, std::initializer_list< double > edit_cost_constants={})
Sets the edit costs to one of the predefined edit costs.
GEDMethod
Selects the method.
const std::string & get_graph_class(GEDGraph::GraphID graph_id) const
Returns the graph class.
double get_runtime(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns runtime.
double get_upper_bound(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id) const
Returns upper bound for edit distance between the input graphs.
void run_method(GEDGraph::GraphID g_id, GEDGraph::GraphID h_id)
Runs the GED method specified by call to set_method() between the graphs with IDs g_id and h_id...
void set_method(Options::GEDMethod method, const std::string &options=std::string(""))
Sets the GEDMethod to be used by run_method().
Provides the API of GEDLIB.