mirror of
https://github.com/schrodinger/pymol-open-source.git
synced 2026-06-04 20:04:21 +08:00
Send CIF parser errors either to the feedback mechanism (warning level), or return pymol::Error().
263 lines
6.3 KiB
C++
263 lines
6.3 KiB
C++
/*
|
|
* CIF tokenizer
|
|
*
|
|
* (c) 2014 Schrodinger, Inc.
|
|
*/
|
|
|
|
#ifndef _H_CIFFILE
|
|
#define _H_CIFFILE
|
|
|
|
#include <cstddef>
|
|
#include <cstring>
|
|
#include <map>
|
|
#include <memory>
|
|
#include <vector>
|
|
|
|
// for pymol::default_free
|
|
#include "MemoryDebug.h"
|
|
|
|
namespace pymol {
|
|
namespace _cif_detail {
|
|
|
|
/**
|
|
* Null-terminated string view.
|
|
*/
|
|
class zstring_view {
|
|
const char* m_data;
|
|
|
|
public:
|
|
zstring_view(const char* s) : m_data(s) {}
|
|
|
|
bool operator<(zstring_view rhs) const {
|
|
return std::strcmp(m_data, rhs.m_data) < 0;
|
|
}
|
|
};
|
|
|
|
/**
|
|
* Convert a raw cif data value to a typed value
|
|
*/
|
|
template <typename T> T raw_to_typed(const char*);
|
|
|
|
} // namespace _cif_detail
|
|
|
|
// cif data types
|
|
class cif_data;
|
|
class cif_loop;
|
|
class cif_array;
|
|
|
|
/**
|
|
* Class for reading CIF files.
|
|
* Parses the entire file and exposes its data blocks.
|
|
*
|
|
* Read CIF file:
|
|
* @verbatim auto cf = cif_file("file.cif"); @endverbatim
|
|
*
|
|
* Read CIF string:
|
|
* @verbatim auto cf = cif_file(nullptr, cifstring); @endverbatim
|
|
*
|
|
* Iterate over data blocks:
|
|
* @verbatim
|
|
for (auto& block : cf.datablocks()) {
|
|
// data_<code>
|
|
const char* code = block->code();
|
|
|
|
// get data item pointer, or NULL if name not found
|
|
auto* dataitem1 = block->get_arr("_some.name1");
|
|
auto* dataitem2 = block->get_arr("_some.name2", "_alternate.name");
|
|
|
|
// get data item pointer, or default item if name not found
|
|
auto* dataitem3 = block->get_opt("_some.name3");
|
|
|
|
// value of data item
|
|
const char* stringvalue = dataitem3->as_s();
|
|
int intvalue = dataitem3->as_i();
|
|
|
|
// values of looped data item
|
|
for (unsigned i = 0, i_end = dataitem3->size(); i != i_end; ++i) {
|
|
const char* stringvalue = dataitem3->as_s(i);
|
|
}
|
|
}
|
|
@endverbatim
|
|
*/
|
|
class cif_file {
|
|
std::vector<char*> m_tokens;
|
|
std::vector<cif_data> m_datablocks;
|
|
std::unique_ptr<char, pymol::default_free> m_contents;
|
|
|
|
/**
|
|
* Parse CIF string
|
|
* @param p CIF string (takes ownership)
|
|
* @post datablocks() is valid
|
|
*/
|
|
bool parse(char*&&);
|
|
|
|
public:
|
|
/// Parse CIF file
|
|
bool parse_file(const char*);
|
|
|
|
/// Parse CIF string
|
|
bool parse_string(const char*);
|
|
|
|
protected:
|
|
/// Report a parsing error
|
|
virtual void error(const char*);
|
|
|
|
public:
|
|
cif_file();
|
|
cif_file(cif_file&&);
|
|
cif_file(const cif_file&) = delete;
|
|
cif_file& operator=(cif_file&&);
|
|
cif_file& operator=(const cif_file&) = delete;
|
|
virtual ~cif_file();
|
|
|
|
/// Construct from file name or buffer
|
|
cif_file(const char* filename, const char* contents = nullptr);
|
|
|
|
/// Data blocks
|
|
const std::vector<cif_data>& datablocks() const { return m_datablocks; }
|
|
};
|
|
|
|
/**
|
|
* View on a CIF data array. The viewed data is owned by the cif_file
|
|
*/
|
|
class cif_array {
|
|
friend class cif_file;
|
|
|
|
private:
|
|
enum { NOT_IN_LOOP = -1 };
|
|
|
|
// column index, -1 if not in loop
|
|
short col;
|
|
|
|
// pointer to either loop or single value
|
|
union {
|
|
const cif_loop * loop;
|
|
const char * value;
|
|
} pointer;
|
|
|
|
// Raw data value or NULL for unknown/inapplicable and `pos >= size()`
|
|
const char* get_value_raw(unsigned pos = 0) const;
|
|
|
|
// point this array to a loop (only for parsing)
|
|
void set_loop(const cif_loop * loop, short col_) {
|
|
col = col_;
|
|
pointer.loop = loop;
|
|
};
|
|
|
|
// point this array to a single value (only for parsing)
|
|
void set_value(const char * value) {
|
|
col = NOT_IN_LOOP;
|
|
pointer.value = value;
|
|
};
|
|
|
|
public:
|
|
// constructor
|
|
cif_array() = default;
|
|
|
|
// constructor (only needed for EMPTY_ARRAY)
|
|
cif_array(std::nullptr_t) { set_value(nullptr); }
|
|
|
|
/// Number of elements in this array (= number of rows in loop)
|
|
unsigned size() const;
|
|
|
|
/// True if value in ['.', '?']
|
|
bool is_missing(unsigned pos = 0) const { return !get_value_raw(pos); }
|
|
|
|
/// True if all values in ['.', '?']
|
|
bool is_missing_all() const;
|
|
|
|
/**
|
|
* Get element as type T. If `pos >= size()` then return `d`.
|
|
* @param pos element index (= row index in loop)
|
|
* @param d default value for unknown/inapplicable elements
|
|
*/
|
|
template <typename T> T as(unsigned pos = 0, T d = T()) const {
|
|
const char* s = get_value_raw(pos);
|
|
return s ? _cif_detail::raw_to_typed<T>(s) : d;
|
|
}
|
|
|
|
/**
|
|
* Get element as null-terminated string. The default value is the empty
|
|
* string, unlike as<const char*>() which returns NULL as the default value.
|
|
* If `pos >= size()` then return `d`.
|
|
* @param pos element index (= row index in loop)
|
|
* @param d default value for unknown/inapplicable elements
|
|
*/
|
|
const char* as_s(unsigned pos = 0, const char* d = "") const {
|
|
return as(pos, d);
|
|
}
|
|
|
|
/// Alias for as<int>()
|
|
int as_i(unsigned pos = 0, int d = 0) const { return as(pos, d); }
|
|
|
|
/// Alias for as<double>()
|
|
double as_d(unsigned pos = 0, double d = 0.) const { return as(pos, d); }
|
|
|
|
/**
|
|
* Get a copy of the array.
|
|
* @param d default value for unknown/inapplicable elements
|
|
*/
|
|
template <typename T> std::vector<T> to_vector(T d = T()) const {
|
|
auto n = size();
|
|
std::vector<T> v;
|
|
v.reserve(n);
|
|
for (unsigned i = 0; i < n; ++i)
|
|
v.push_back(as<T>(i, d));
|
|
return v;
|
|
}
|
|
};
|
|
|
|
/**
|
|
* CIF data block. The viewed data is owned by the cif_file.
|
|
*/
|
|
class cif_data {
|
|
friend class cif_file;
|
|
|
|
// data_<code>
|
|
const char* m_code = nullptr;
|
|
|
|
std::map<_cif_detail::zstring_view, cif_array> m_dict;
|
|
std::map<_cif_detail::zstring_view, cif_data> m_saveframes;
|
|
|
|
// only needed for freeing
|
|
std::vector<std::unique_ptr<cif_loop>> m_loops;
|
|
|
|
// generic default value
|
|
static const cif_array* empty_array();
|
|
|
|
public:
|
|
|
|
cif_data() = default;
|
|
cif_data(const cif_data&) = delete;
|
|
cif_data(cif_data&&) = default;
|
|
cif_data& operator=(const cif_data&) = delete;
|
|
cif_data& operator=(cif_data&&) = default;
|
|
|
|
/// Block code (never NULL)
|
|
const char* code() const { return m_code ? m_code : ""; }
|
|
|
|
// Get a pointer to array or NULL if not found
|
|
const cif_array* get_arr(const char* key) const;
|
|
template <typename... Args>
|
|
const cif_array* get_arr(const char* key, Args... aliases) const
|
|
{
|
|
auto arr = get_arr(key);
|
|
return arr ? arr : get_arr(aliases...);
|
|
}
|
|
|
|
/// Like get_arr() but return a default value instead of NULL if not found
|
|
template <typename... Args> const cif_array* get_opt(Args... keys) const
|
|
{
|
|
auto arr = get_arr(keys...);
|
|
return arr ? arr : empty_array();
|
|
}
|
|
|
|
/// Get a pointer to a save frame or NULL if not found
|
|
const cif_data* get_saveframe(const char* code) const;
|
|
};
|
|
|
|
} // namespace pymol
|
|
|
|
#endif
|
|
// vi:sw=2:ts=2
|