mirror of
https://github.com/rdkit/rdkit.git
synced 2026-06-03 21:44:30 +08:00
265 lines
9.6 KiB
C++
265 lines
9.6 KiB
C++
// morpho/cdl/bgl_expansions/algorithms/ullmann.hpp header file//
|
|
// Copyright (c) 2003-2008 Vladimir J. Sykora
|
|
// Copyright (c) 2007-2008 Vladimir J. Sykora and NCU Studies Ltd
|
|
// Modifications by Greg Landrum, January 2009
|
|
//
|
|
//*****************************************************************************
|
|
// Permission is hereby granted, free of charge, to any person or organization
|
|
// obtaining a copy of the software and accompanying documentation covered by
|
|
// this license (the "Software") to use, reproduce, display, distribute,
|
|
// execute, and transmit the Software, and to prepare derivative works of the
|
|
// Software, and to permit third-parties to whom the Software is furnished to
|
|
// do so, all subject to the following:
|
|
//
|
|
// The copyright notices in the Software and this entire statement, including
|
|
// the above license grant, this restriction and the following disclaimer,
|
|
// must be included in all copies of the Software, in whole or in part, and
|
|
// all derivative works of the Software, unless such copies or derivative
|
|
// works are solely in the form of machine-executable object code generated by
|
|
// a source language processor.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT
|
|
// SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE
|
|
// FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE,
|
|
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
// DEALINGS IN THE SOFTWARE.
|
|
|
|
//*****************************************************************************
|
|
|
|
//-----------------------------------------------------------------------------
|
|
|
|
// Algorithm due to JR Ullmann. "An Algorithm for Subgraph
|
|
// Isomorphism". Journal of the Association for
|
|
// Computing Machinery, Vol 23, No.1, January 1976, pp 31-42.
|
|
|
|
#ifndef MORPHO_CDL_BGL_EXP_ULLMANN_HPP
|
|
#define MORPHO_CDL_BGL_EXP_ULLMANN_HPP
|
|
|
|
// -------- boost
|
|
#include <boost/numeric/ublas/matrix.hpp>
|
|
#include <boost/graph/graph_traits.hpp>
|
|
// -------- std
|
|
#include <utility> // for std::pair<>
|
|
#include <algorithm>
|
|
|
|
namespace boost {
|
|
namespace detail {
|
|
|
|
template <class Graph, class UblasMatrix, class BackInsertionSequence,
|
|
class EdgeLabeling>
|
|
bool forward_checking(const Graph& g1, const Graph& g2, UblasMatrix& M,
|
|
size_t count, BackInsertionSequence& F,
|
|
size_t num_vert_g1, size_t num_vert_g2,
|
|
EdgeLabeling& edge_labeling) {
|
|
typedef std::pair<typename graph_traits<Graph>::edge_descriptor, bool>
|
|
edge_presence;
|
|
typename BackInsertionSequence::iterator fi, fi_end = F.end();
|
|
for (size_t k = count + 1; k < num_vert_g1; ++k) {
|
|
for (size_t l = 0; l < num_vert_g2; ++l) {
|
|
if (!M(k, l)) continue;
|
|
// check mapping:
|
|
fi = F.begin();
|
|
while (fi != fi_end) {
|
|
bool flag1(0), flag1_1(0), flag2(0), flag2_1(0);
|
|
edge_presence ep1 = edge(k, fi->first, g1);
|
|
if (ep1.second) {
|
|
flag1_1 = true;
|
|
edge_presence ep2 = edge(l, fi->second, g2);
|
|
if (ep2.second) flag1 = edge_labeling(ep1.first, ep2.first);
|
|
}
|
|
if (flag1_1 && flag1) {
|
|
M(k, l) = 1;
|
|
++fi;
|
|
continue;
|
|
}
|
|
edge_presence ep2 = edge(l, fi->second, g2);
|
|
if (ep2.second) {
|
|
flag2_1 = true;
|
|
ep1 = edge(k, fi->first, g1);
|
|
if (ep1.second) {
|
|
flag2 = edge_labeling(ep1.first, ep2.first);
|
|
} else {
|
|
// ring closed in main structure, not closed in query. This should
|
|
// pass
|
|
flag2 = true;
|
|
}
|
|
}
|
|
if (flag2_1 && flag2) { // if one edge exists, there must be a mapping
|
|
M(k, l) = 1;
|
|
} else if (!flag1_1 && !flag2_1) { // or both edges are not present
|
|
M(k, l) = 1;
|
|
} else
|
|
M(k, l) = 0; // if not, there's no mapping
|
|
++fi;
|
|
}
|
|
}
|
|
}
|
|
// TODO: change the data structure of the M matrix to sparse matrix. This
|
|
// wouldn't be necessary
|
|
size_t cero_row(0);
|
|
for (size_t k = 0; k < num_vert_g1; ++k) {
|
|
for (size_t l = 0; l < num_vert_g2; ++l) {
|
|
if (M(k, l))
|
|
break;
|
|
else
|
|
++cero_row;
|
|
}
|
|
if (cero_row == num_vert_g2) return false; // if there is a cero row
|
|
cero_row = 0;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
template <class Graph, class EdgeLabeling, class UblasMatrix,
|
|
class BackInsertionSequence>
|
|
bool backtrack(const Graph& g1, const Graph& g2, size_t count,
|
|
const UblasMatrix& M, BackInsertionSequence& F,
|
|
const size_t num_vert_g1, const size_t num_vert_g2,
|
|
EdgeLabeling& edge_labeling) {
|
|
if (count == num_vert_g1) return true;
|
|
for (size_t i = 0; i < num_vert_g2; ++i) {
|
|
if (M(count, i)) {
|
|
F.push_back(std::make_pair(count, i));
|
|
UblasMatrix M_prime(M);
|
|
for (size_t m = count + 1; m < num_vert_g1; ++m) {
|
|
M_prime(m, i) = 0;
|
|
}
|
|
|
|
if (forward_checking(g1, g2, M_prime, count, F, num_vert_g1, num_vert_g2,
|
|
edge_labeling)) {
|
|
if (backtrack(g1, g2, count + 1, M_prime, F, num_vert_g1, num_vert_g2,
|
|
edge_labeling)) {
|
|
return true;
|
|
}
|
|
}
|
|
F.erase(std::remove(F.begin(), F.end(), std::make_pair(count, i)),
|
|
F.end());
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
template <class Graph, class EdgeLabeling, class UblasMatrix,
|
|
class DoubleBackInsertionSequence>
|
|
void backtrack_all(const Graph& g1, const Graph& g2, size_t count,
|
|
const UblasMatrix& M, DoubleBackInsertionSequence& FF,
|
|
const size_t num_vert_g1, const size_t num_vert_g2,
|
|
EdgeLabeling& edge_labeling) {
|
|
if (count == num_vert_g1) return;
|
|
DoubleBackInsertionSequence holdFF;
|
|
holdFF.insert(holdFF.begin(), FF.begin(), FF.end());
|
|
FF.clear();
|
|
for (size_t i = 0; i < num_vert_g2; ++i) {
|
|
if (M(count, i)) {
|
|
DoubleBackInsertionSequence tFF;
|
|
|
|
UblasMatrix M_prime(M);
|
|
for (size_t m = count + 1; m < num_vert_g1; ++m) {
|
|
M_prime(m, i) = 0;
|
|
}
|
|
|
|
if (holdFF.size()) {
|
|
for (typename DoubleBackInsertionSequence::const_iterator iter =
|
|
holdFF.begin();
|
|
iter != holdFF.end(); ++iter) {
|
|
typename DoubleBackInsertionSequence::value_type F = *iter;
|
|
F.push_back(std::make_pair(count, i));
|
|
if (forward_checking(g1, g2, M_prime, count, F, num_vert_g1,
|
|
num_vert_g2, edge_labeling)) {
|
|
tFF.push_back(F);
|
|
}
|
|
}
|
|
} else {
|
|
typename DoubleBackInsertionSequence::value_type F;
|
|
F.push_back(std::make_pair(count, i));
|
|
if (forward_checking(g1, g2, M_prime, count, F, num_vert_g1,
|
|
num_vert_g2, edge_labeling)) {
|
|
tFF.push_back(F);
|
|
}
|
|
}
|
|
backtrack_all(g1, g2, count + 1, M_prime, tFF, num_vert_g1, num_vert_g2,
|
|
edge_labeling);
|
|
if (tFF.size()) {
|
|
for (typename DoubleBackInsertionSequence::const_iterator iter =
|
|
tFF.begin();
|
|
iter != tFF.end(); ++iter) {
|
|
FF.push_back(*iter);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
template <class Graph, class VertexLabeling // binary predicate
|
|
,
|
|
class UblasMatrix>
|
|
void prepareM(const Graph& g1, const Graph& g2, VertexLabeling& vertex_labeling,
|
|
UblasMatrix& M) {
|
|
size_t rows(num_vertices(g1));
|
|
size_t cols(num_vertices(g2));
|
|
M.resize(rows, cols);
|
|
// initialize the matrix:
|
|
for (size_t i = 0; i < rows; ++i) {
|
|
for (size_t j = 0; j < cols; ++j) {
|
|
if (out_degree(j, g2) >= out_degree(i, g1) && vertex_labeling(i, j)) {
|
|
M(i, j) = 1;
|
|
} else
|
|
M(i, j) = 0;
|
|
}
|
|
}
|
|
}
|
|
} // namespace detail
|
|
|
|
// test if g1 is a subgraph of g2. mapped vertices are returned in F
|
|
// Mapping : first: g1 vertices, second : g2 vertices
|
|
// O( num_vertices(g1)! num_vertices(g1) ^ 3 )
|
|
// This function doesnt Work with filtered graphs!
|
|
// The size of F doesn't indicate match!
|
|
template <
|
|
class Graph, class VertexLabeling // binary predicate
|
|
,
|
|
class EdgeLabeling // binary predicate
|
|
,
|
|
class
|
|
BackInsertionSequence // contains
|
|
// std::pair<vertex_descriptor,vertex_descriptor>
|
|
>
|
|
bool ullmann(const Graph& g1, const Graph& g2, VertexLabeling& vertex_labeling,
|
|
EdgeLabeling& edge_labeling, BackInsertionSequence& F) {
|
|
typedef ::boost::numeric::ublas::matrix<int> matrix_t;
|
|
size_t rows(num_vertices(g1));
|
|
size_t cols(num_vertices(g2));
|
|
matrix_t M;
|
|
detail::prepareM(g1, g2, vertex_labeling, M);
|
|
size_t count(0);
|
|
return detail::backtrack(g1, g2, count, M, F, rows, cols, edge_labeling);
|
|
}
|
|
|
|
// test if g1 is a subgraph of g2.
|
|
// F returns all mappings of g1 in g2. mapping in separate containers
|
|
template <class Graph, class VertexLabeling // binary predicate
|
|
,
|
|
class EdgeLabeling // binary predicate
|
|
,
|
|
class DoubleBackInsertionSequence // contains a back insertion
|
|
// sequence
|
|
>
|
|
bool ullmann_all(const Graph& g1, const Graph& g2,
|
|
VertexLabeling& vertex_labeling, EdgeLabeling& edge_labeling,
|
|
DoubleBackInsertionSequence& F) {
|
|
typedef ::boost::numeric::ublas::matrix<int> matrix_t;
|
|
size_t rows(num_vertices(g1));
|
|
size_t cols(num_vertices(g2));
|
|
matrix_t M;
|
|
detail::prepareM(g1, g2, vertex_labeling, M);
|
|
size_t count(0);
|
|
detail::backtrack_all(g1, g2, count, M, F, rows, cols, edge_labeling);
|
|
return !F.empty();
|
|
}
|
|
|
|
} // namespace boost
|
|
|
|
#endif // MORPHO_CDL_BGL_EXP_ULLMANN_HPP
|