mirror of
https://github.com/rdkit/rdkit.git
synced 2026-06-03 21:44:30 +08:00
* Defer numpy initialization to first use in rdchem, rdmolops, cDataStructs
`from rdkit import Chem` unconditionally bootstrapped numpy (~120ms) via
import_array()/boost::python::numpy::initialize() in module init functions,
even when no numpy-dependent APIs were called. This is costly in cold-start
environments like AWS Lambda.
Move numpy initialization behind lazy guards (static bool + first-call init)
in rdchem.so, rdmolops.so, and cDataStructs.so. Numpy now loads only when
an API that actually needs it is invoked (GetDistanceMatrix, GetPositions,
SetPositions, GetAdjacencyMatrix, ConvertToNumpyArray, etc.).
Also change Conformer::SetPos to accept python::object instead of
np::ndarray to prevent Boost.Python from requiring numpy type conversion
before the lazy guard runs.
Adds test_lazy_numpy.py with subprocess-based tests verifying:
- `from rdkit import Chem` does not load numpy
- SmilesToMol/MolToSmiles work without numpy
- numpy loads on demand when array APIs are called
* skip inchi tests if not available
* switch to threadsafe once_flag, like elsewhere
* finish ifdef style
* switch to magic static style
* Revert "switch to magic static style"
This reverts commit 7300188db7.
140 lines
4.5 KiB
C++
140 lines
4.5 KiB
C++
// $Id$
|
|
//
|
|
// Copyright (c) 2001-2006 greg Landrum and Rational Discovery LLC
|
|
//
|
|
// @@ All Rights Reserved @@
|
|
// This file is part of the RDKit.
|
|
// The contents are covered by the terms of the BSD license
|
|
// which is included in the file license.txt, found at the root
|
|
// of the RDKit source tree.
|
|
//
|
|
#define PY_ARRAY_UNIQUE_SYMBOL rddatastructs_array_API
|
|
|
|
#ifdef RDK_BUILD_THREADSAFE_SSS
|
|
#include <mutex>
|
|
#endif
|
|
|
|
#include <RDBoost/python.h>
|
|
#include <RDBoost/Wrap.h>
|
|
#include <DataStructs/BitVects.h>
|
|
#include <DataStructs/DiscreteValueVect.h>
|
|
#include <DataStructs/SparseIntVect.h>
|
|
#include <DataStructs/RealValueVect.h>
|
|
#include <RDBoost/boost_numpy.h>
|
|
#include <numpy/npy_common.h>
|
|
#include <RDBoost/import_array.h>
|
|
#include <RDBoost/pyint_api.h>
|
|
|
|
namespace python = boost::python;
|
|
|
|
void wrap_SBV();
|
|
void wrap_EBV();
|
|
void wrap_BitOps();
|
|
void wrap_Utils();
|
|
void wrap_discreteValVect();
|
|
void wrap_realValVect();
|
|
void wrap_sparseIntVect();
|
|
void wrap_FPB();
|
|
|
|
#ifdef RDK_BUILD_THREADSAFE_SSS
|
|
static std::once_flag s_ds_numpy_init_flag;
|
|
#endif
|
|
|
|
static void ds_ensure_numpy() {
|
|
#ifdef RDK_BUILD_THREADSAFE_SSS
|
|
std::call_once(s_ds_numpy_init_flag, rdkit_import_array);
|
|
#else
|
|
static bool initialized = false;
|
|
if (!initialized) {
|
|
initialized = true;
|
|
rdkit_import_array();
|
|
}
|
|
#endif
|
|
}
|
|
|
|
namespace {
|
|
template <typename T, typename U>
|
|
void converter(const T &v, python::object destArray, U func) {
|
|
ds_ensure_numpy();
|
|
if (!PyArray_Check(destArray.ptr())) {
|
|
throw_value_error("Expecting a Numeric array object");
|
|
}
|
|
auto *destP = (PyArrayObject *)destArray.ptr();
|
|
npy_intp ndims[1];
|
|
ndims[0] = v.size();
|
|
PyArray_Dims dims;
|
|
dims.ptr = ndims;
|
|
dims.len = 1;
|
|
PyArray_Resize(destP, &dims, 0, NPY_ANYORDER);
|
|
for (unsigned int i = 0; i < v.size(); ++i) {
|
|
PyObject *iItem = func(v[i]);
|
|
PyArray_SETITEM(destP, static_cast<char *>(PyArray_GETPTR1(destP, i)),
|
|
iItem);
|
|
Py_DECREF(iItem);
|
|
}
|
|
}
|
|
} // namespace
|
|
|
|
template <typename T>
|
|
void convertToIntNumpyArray(const T &v, python::object destArray) {
|
|
converter(v, destArray, PyLong_FromLong);
|
|
}
|
|
template <typename T>
|
|
void convertToDoubleNumpyArray(const T &v, python::object destArray) {
|
|
converter(v, destArray, PyFloat_FromDouble);
|
|
}
|
|
|
|
BOOST_PYTHON_MODULE(cDataStructs) {
|
|
python::scope().attr("__doc__") =
|
|
"Module containing an assortment of functionality for basic data "
|
|
"structures.\n"
|
|
"\n"
|
|
"At the moment the data structures defined are:\n"
|
|
" Bit Vector classes (for storing signatures, fingerprints and the "
|
|
"like:\n"
|
|
" - ExplicitBitVect: class for relatively small (10s of thousands of "
|
|
"bits) or\n"
|
|
" dense bit vectors.\n"
|
|
" - SparseBitVect: class for large, sparse bit vectors\n"
|
|
" DiscreteValueVect: class for storing vectors of integers\n"
|
|
" SparseIntVect: class for storing sparse vectors of integers\n";
|
|
|
|
wrap_Utils();
|
|
wrap_SBV();
|
|
wrap_EBV();
|
|
wrap_BitOps();
|
|
wrap_discreteValVect();
|
|
wrap_realValVect();
|
|
wrap_sparseIntVect();
|
|
wrap_FPB();
|
|
|
|
python::def(
|
|
"ConvertToNumpyArray",
|
|
(void (*)(const ExplicitBitVect &, python::object))convertToIntNumpyArray,
|
|
(python::arg("bv"), python::arg("destArray")));
|
|
python::def("ConvertToNumpyArray",
|
|
(void (*)(const RDKit::DiscreteValueVect &,
|
|
python::object))convertToIntNumpyArray,
|
|
(python::arg("bv"), python::arg("destArray")));
|
|
python::def("ConvertToNumpyArray",
|
|
(void (*)(const RDKit::SparseIntVect<std::int32_t> &,
|
|
python::object))convertToIntNumpyArray,
|
|
(python::arg("bv"), python::arg("destArray")));
|
|
python::def("ConvertToNumpyArray",
|
|
(void (*)(const RDKit::SparseIntVect<boost::int64_t> &,
|
|
python::object))convertToIntNumpyArray,
|
|
(python::arg("bv"), python::arg("destArray")));
|
|
python::def("ConvertToNumpyArray",
|
|
(void (*)(const RDKit::SparseIntVect<std::uint32_t> &,
|
|
python::object))convertToIntNumpyArray,
|
|
(python::arg("bv"), python::arg("destArray")));
|
|
python::def("ConvertToNumpyArray",
|
|
(void (*)(const RDKit::SparseIntVect<boost::uint64_t> &,
|
|
python::object))convertToIntNumpyArray,
|
|
(python::arg("bv"), python::arg("destArray")));
|
|
python::def("ConvertToNumpyArray",
|
|
(void (*)(const RDKit::RealValueVect &,
|
|
python::object))convertToDoubleNumpyArray,
|
|
(python::arg("rvv"), python::arg("destArray")));
|
|
}
|