Program Listing for File compound.hpp

Return to documentation for file (cif++/compound.hpp)

/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (c) 2020-2022 NKI/AVL, Netherlands Cancer Institute
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#pragma once

#include "cif++/atom_type.hpp"
#include "cif++/datablock.hpp"
#include "cif++/exports.hpp"
#include "cif++/point.hpp"
#include "cif++/utilities.hpp"

#include <map>
#include <set>
#include <tuple>
#include <vector>



namespace cif
{

// --------------------------------------------------------------------

class compound;
struct compound_atom;
class compound_factory_impl;

enum class bond_type
{
    sing,
    doub,
    trip,
    quad,
    arom,
    poly,
    delo,
    pi,
};

std::string bond_type_to_string(bond_type bondType);

bond_type parse_bond_type_from_string(const std::string &bondType);

enum class stereo_config_type : uint8_t
{
    N = 'N',
    R = 'R',
    S = 'S'
};

std::string to_string(stereo_config_type stereo_config);

stereo_config_type parse_stereo_config_from_string(const std::string &stereo_config);


struct compound_atom
{
    std::string id;
    atom_type type_symbol;
    int charge = 0;
    bool aromatic = false;
    bool leaving_atom = false;
    stereo_config_type stereo_config = stereo_config_type::N;
    float x,
        y,
        z;

    point get_location() const
    {
        return { x, y, z };
    }
};


struct compound_bond
{
    std::string atom_id[2];
    bond_type type;
    bool aromatic = false,
        stereo_config = false;
};


class compound
{
  public:
    // accessors

    std::string id() const { return m_id; }
    std::string name() const { return m_name; }
    std::string type() const { return m_type; }
    std::string formula() const { return m_formula; }
    float formula_weight() const { return m_formula_weight; }
    int formal_charge() const { return m_formal_charge; }

    std::string group() const { return m_group; }

    const std::vector<compound_atom> &atoms() const { return m_atoms; }
    const std::vector<compound_bond> &bonds() const { return m_bonds; }

    compound_atom get_atom_by_atom_id(const std::string &atom_id) const;

    bool atoms_bonded(const std::string &atomId_1, const std::string &atomId_2) const;
    float bond_length(const std::string &atomId_1, const std::string &atomId_2) const;

    bool is_water() const
    {
        return m_id == "HOH" or m_id == "H2O" or m_id == "WAT";
    }

  private:
    friend class compound_factory_impl;
    friend class CCD_compound_factory_impl;
    friend class CCP4_compound_factory_impl;

    compound(cif::datablock &db);
    compound(cif::datablock &db, const std::string &id, const std::string &name, const std::string &type, const std::string &group);

    std::string m_id;
    std::string m_name;
    std::string m_type;
    std::string m_group;
    std::string m_formula;
    float m_formula_weight = 0;
    int m_formal_charge = 0;
    std::vector<compound_atom> m_atoms;
    std::vector<compound_bond> m_bonds;
};

// --------------------------------------------------------------------
// Factory class for compound and Link objects


class compound_factory
{
  public:

    static void init(bool useThreadLocalInstanceOnly);

    static compound_factory &instance();

    static void clear();

    void set_default_dictionary(const std::filesystem::path &inDictFile);

    void push_dictionary(const std::filesystem::path &inDictFile);

    void pop_dictionary();

    bool is_known_peptide(const std::string &res_name) const;

    bool is_known_base(const std::string &res_name) const;

    const compound *create(std::string id);

    ~compound_factory();

    CIFPP_EXPORT static const std::map<std::string, char> kAAMap,
        kBaseMap;

  private:
    compound_factory();

    compound_factory(const compound_factory &) = delete;
    compound_factory &operator=(const compound_factory &) = delete;

    static std::unique_ptr<compound_factory> s_instance;
    static thread_local std::unique_ptr<compound_factory> tl_instance;
    static bool s_use_thread_local_instance;

    std::shared_ptr<compound_factory_impl> m_impl;
};

} // namespace cif