RDKit
Open-source cheminformatics and machine learning.
Loading...
Searching...
No Matches
RGroupDecompParams.h
Go to the documentation of this file.
1//
2// Copyright (c) 2017-2023, Novartis Institutes for BioMedical Research Inc.
3// and other RDKit contributors
4//
5// @@ All Rights Reserved @@
6// This file is part of the RDKit.
7// The contents are covered by the terms of the BSD license
8// which is included in the file license.txt, found at the root
9// of the RDKit source tree.
10//
11
12#ifndef RDKIT_RGROUPDECOMPPARAMS_H
13#define RDKIT_RGROUPDECOMPPARAMS_H
14
15#include "../RDKitBase.h"
18
19namespace RDKit {
20
22 RGroupLabels, unsigned int, IsotopeLabels = 0x01, AtomMapLabels = 0x02,
23 AtomIndexLabels = 0x04, RelabelDuplicateLabels = 0x08,
24 MDLRGroupLabels = 0x10,
25 DummyAtomLabels = 0x20, // These are rgroups but will get relabelled
26 AutoDetect = 0xFF);
27
28BETTER_ENUM(RGroupMatching, unsigned int, Greedy = 0x01, GreedyChunks = 0x02,
29 Exhaustive = 0x04, // not really useful for large sets
30 NoSymmetrization = 0x08, GA = 0x10);
31
32BETTER_ENUM(RGroupLabelling, unsigned int, AtomMap = 0x01, Isotope = 0x02,
33 MDLRGroup = 0x04);
34
35BETTER_ENUM(RGroupCoreAlignment, unsigned int, NoAlignment = 0x0, MCS = 0x01);
36
37BETTER_ENUM(RGroupScore, unsigned int, Match = 0x1, FingerprintVariance = 0x4);
38
40 unsigned int labels = RGroupLabels::AutoDetect;
41 unsigned int matchingStrategy = RGroupMatching::GreedyChunks;
42 unsigned int scoreMethod = RGroupScore::Match;
43 unsigned int rgroupLabelling =
44 RGroupLabelling::AtomMap | RGroupLabelling::MDLRGroup;
45 unsigned int alignment = RGroupCoreAlignment::MCS;
46
47 unsigned int chunkSize = 5;
48 //! only allow rgroup decomposition at the specified rgroups
49 bool onlyMatchAtRGroups = false;
50 //! remove all user-defined rgroups that only have hydrogens
52 //! remove all user-defined rgroups that only have hydrogens,
53 //! and also remove the corresponding labels from the core
55 //! remove all hydrogens from the output molecules
57 //! allow labelled Rgroups of degree 2 or more
59 //! unlabelled core atoms can have multiple rgroups
61 //! Permit a core to match more than once in the same molecule if the sets of
62 // matched atoms are not equal.
64 // extended query settings for core matching
65 bool doTautomers = false;
66 bool doEnumeration = false;
67 //! include target molecule (featuring explicit hydrogens where they
68 //! coincide with R groups in the core) into RGD results,
69 //! and set _rgroupTargetAtoms and _rgroupTargetBonds properties
70 //! on R groups and core as vectors of target atom and bond indices
71 //! to enable highlighting for SAR analysis (see
72 //! https://greglandrum.github.io/rdkit-blog/posts/2021-08-07-rgd-and-highlighting.html)
74
75 double timeout = -1.0; ///< timeout in seconds. <=0 indicates no timeout
76
77 // Determine how to assign the rgroup labels from the given core
78 unsigned int autoGetLabels(const RWMol &);
79
80 // Prepare the core for substructure searching and rgroup assignment
81 bool prepareCore(RWMol &, const RWMol *alignCore);
82
83 // Add r groups to unlabelled atoms if allowMultipleRGroupsOnUnlabelled is set
85
86 // Parameters specific to GA
87
88 // GA population size or -1 to use best guess
90 // GA maximum number of operations or -1 to use best guess
92 // GA number of operations permitted without improvement before exiting (-1
93 // for best guess)
95 // GA random number seed (-1 for default, -2 for random seed)
96 int gaRandomSeed = -1;
97 // Number of runs
98 int gaNumberRuns = 1;
99 // Sequential or parallel runs?
100#ifdef RDK_BUILD_THREADSAFE_SSS
101 bool gaParallelRuns = true;
102#else
103 bool gaParallelRuns = false;
104#endif
105 // Controls the way substructure matching with the core is done
107
109
110 private:
111 int indexOffset{-1};
112 void checkNonTerminal(const Atom &atom) const;
113};
114
115} // namespace RDKit
116
117#endif // RDKIT_RGROUPDECOMPPARAMS_H
#define BETTER_ENUM(Enum, Underlying,...)
Definition BetterEnums.h:17
pulls in the core RDKit functionality
RWMol is a molecule class that is intended to be edited.
Definition RWMol.h:32
#define RDKIT_RGROUPDECOMPOSITION_EXPORT
Definition export.h:473
Std stuff.
bool allowNonTerminalRGroups
allow labelled Rgroups of degree 2 or more
bool allowMultipleRGroupsOnUnlabelled
unlabelled core atoms can have multiple rgroups
void addDummyAtomsToUnlabelledCoreAtoms(RWMol &core)
bool onlyMatchAtRGroups
only allow rgroup decomposition at the specified rgroups
bool removeAllHydrogenRGroups
remove all user-defined rgroups that only have hydrogens
unsigned int autoGetLabels(const RWMol &)
double timeout
timeout in seconds. <=0 indicates no timeout
bool removeHydrogensPostMatch
remove all hydrogens from the output molecules
bool allowMultipleCoresInSameMol
Permit a core to match more than once in the same molecule if the sets of.
bool prepareCore(RWMol &, const RWMol *alignCore)
SubstructMatchParameters substructmatchParams